/* arm_neon.h (2788713B) - Raw */
1 /*===---- arm_neon.h - ARM Neon intrinsics ---------------------------------=== 2 * 3 * Permission is hereby granted, free of charge, to any person obtaining a copy 4 * of this software and associated documentation files (the "Software"), to deal 5 * in the Software without restriction, including without limitation the rights 6 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 7 * copies of the Software, and to permit persons to whom the Software is 8 * furnished to do so, subject to the following conditions: 9 * 10 * The above copyright notice and this permission notice shall be included in 11 * all copies or substantial portions of the Software. 12 * 13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 16 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 17 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 18 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 19 * THE SOFTWARE. 20 * 21 *===-----------------------------------------------------------------------=== 22 */ 23 24 #ifndef __ARM_NEON_H 25 #define __ARM_NEON_H 26 27 #ifndef __ARM_FP 28 #error "NEON intrinsics not available with the soft-float ABI. 
Please use -mfloat-abi=softfp or -mfloat-abi=hard" 29 #else 30 31 #include <stdint.h> 32 33 #include <arm_bf16.h> 34 #include <arm_vector_types.h> 35 #if defined(__aarch64__) || defined(__arm64ec__) 36 typedef uint8_t poly8_t; 37 typedef uint16_t poly16_t; 38 typedef uint64_t poly64_t; 39 typedef __uint128_t poly128_t; 40 #else 41 typedef int8_t poly8_t; 42 typedef int16_t poly16_t; 43 typedef int64_t poly64_t; 44 #endif 45 typedef __attribute__((neon_polyvector_type(8))) poly8_t poly8x8_t; 46 typedef __attribute__((neon_polyvector_type(16))) poly8_t poly8x16_t; 47 typedef __attribute__((neon_polyvector_type(4))) poly16_t poly16x4_t; 48 typedef __attribute__((neon_polyvector_type(8))) poly16_t poly16x8_t; 49 typedef __attribute__((neon_polyvector_type(1))) poly64_t poly64x1_t; 50 typedef __attribute__((neon_polyvector_type(2))) poly64_t poly64x2_t; 51 52 typedef struct poly8x8x2_t { 53 poly8x8_t val[2]; 54 } poly8x8x2_t; 55 56 typedef struct poly8x16x2_t { 57 poly8x16_t val[2]; 58 } poly8x16x2_t; 59 60 typedef struct poly16x4x2_t { 61 poly16x4_t val[2]; 62 } poly16x4x2_t; 63 64 typedef struct poly16x8x2_t { 65 poly16x8_t val[2]; 66 } poly16x8x2_t; 67 68 typedef struct poly64x1x2_t { 69 poly64x1_t val[2]; 70 } poly64x1x2_t; 71 72 typedef struct poly64x2x2_t { 73 poly64x2_t val[2]; 74 } poly64x2x2_t; 75 76 typedef struct poly8x8x3_t { 77 poly8x8_t val[3]; 78 } poly8x8x3_t; 79 80 typedef struct poly8x16x3_t { 81 poly8x16_t val[3]; 82 } poly8x16x3_t; 83 84 typedef struct poly16x4x3_t { 85 poly16x4_t val[3]; 86 } poly16x4x3_t; 87 88 typedef struct poly16x8x3_t { 89 poly16x8_t val[3]; 90 } poly16x8x3_t; 91 92 typedef struct poly64x1x3_t { 93 poly64x1_t val[3]; 94 } poly64x1x3_t; 95 96 typedef struct poly64x2x3_t { 97 poly64x2_t val[3]; 98 } poly64x2x3_t; 99 100 typedef struct poly8x8x4_t { 101 poly8x8_t val[4]; 102 } poly8x8x4_t; 103 104 typedef struct poly8x16x4_t { 105 poly8x16_t val[4]; 106 } poly8x16x4_t; 107 108 typedef struct poly16x4x4_t { 109 poly16x4_t val[4]; 
110 } poly16x4x4_t; 111 112 typedef struct poly16x8x4_t { 113 poly16x8_t val[4]; 114 } poly16x8x4_t; 115 116 typedef struct poly64x1x4_t { 117 poly64x1_t val[4]; 118 } poly64x1x4_t; 119 120 typedef struct poly64x2x4_t { 121 poly64x2_t val[4]; 122 } poly64x2x4_t; 123 124 #define __ai static __inline__ __attribute__((__always_inline__, __nodebug__)) 125 126 #ifdef __LITTLE_ENDIAN__ 127 #define splatq_lane_bf16(__p0, __p1) __extension__ ({ \ 128 bfloat16x8_t __ret; \ 129 bfloat16x4_t __s0 = __p0; \ 130 __ret = (bfloat16x8_t) __builtin_neon_splatq_lane_bf16((int8x8_t)__s0, __p1, 11); \ 131 __ret; \ 132 }) 133 #else 134 #define splatq_lane_bf16(__p0, __p1) __extension__ ({ \ 135 bfloat16x8_t __ret; \ 136 bfloat16x4_t __s0 = __p0; \ 137 bfloat16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 138 __ret = (bfloat16x8_t) __builtin_neon_splatq_lane_bf16((int8x8_t)__rev0, __p1, 11); \ 139 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 140 __ret; \ 141 }) 142 #define __noswap_splatq_lane_bf16(__p0, __p1) __extension__ ({ \ 143 bfloat16x8_t __ret; \ 144 bfloat16x4_t __s0 = __p0; \ 145 __ret = (bfloat16x8_t) __builtin_neon_splatq_lane_bf16((int8x8_t)__s0, __p1, 11); \ 146 __ret; \ 147 }) 148 #endif 149 150 #ifdef __LITTLE_ENDIAN__ 151 #define splat_lane_bf16(__p0, __p1) __extension__ ({ \ 152 bfloat16x4_t __ret; \ 153 bfloat16x4_t __s0 = __p0; \ 154 __ret = (bfloat16x4_t) __builtin_neon_splat_lane_bf16((int8x8_t)__s0, __p1, 11); \ 155 __ret; \ 156 }) 157 #else 158 #define splat_lane_bf16(__p0, __p1) __extension__ ({ \ 159 bfloat16x4_t __ret; \ 160 bfloat16x4_t __s0 = __p0; \ 161 bfloat16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 162 __ret = (bfloat16x4_t) __builtin_neon_splat_lane_bf16((int8x8_t)__rev0, __p1, 11); \ 163 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 164 __ret; \ 165 }) 166 #define __noswap_splat_lane_bf16(__p0, __p1) __extension__ ({ \ 167 bfloat16x4_t __ret; \ 168 
bfloat16x4_t __s0 = __p0; \ 169 __ret = (bfloat16x4_t) __builtin_neon_splat_lane_bf16((int8x8_t)__s0, __p1, 11); \ 170 __ret; \ 171 }) 172 #endif 173 174 #ifdef __LITTLE_ENDIAN__ 175 #define splatq_laneq_bf16(__p0, __p1) __extension__ ({ \ 176 bfloat16x8_t __ret; \ 177 bfloat16x8_t __s0 = __p0; \ 178 __ret = (bfloat16x8_t) __builtin_neon_splatq_laneq_bf16((int8x16_t)__s0, __p1, 43); \ 179 __ret; \ 180 }) 181 #else 182 #define splatq_laneq_bf16(__p0, __p1) __extension__ ({ \ 183 bfloat16x8_t __ret; \ 184 bfloat16x8_t __s0 = __p0; \ 185 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 186 __ret = (bfloat16x8_t) __builtin_neon_splatq_laneq_bf16((int8x16_t)__rev0, __p1, 43); \ 187 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 188 __ret; \ 189 }) 190 #define __noswap_splatq_laneq_bf16(__p0, __p1) __extension__ ({ \ 191 bfloat16x8_t __ret; \ 192 bfloat16x8_t __s0 = __p0; \ 193 __ret = (bfloat16x8_t) __builtin_neon_splatq_laneq_bf16((int8x16_t)__s0, __p1, 43); \ 194 __ret; \ 195 }) 196 #endif 197 198 #ifdef __LITTLE_ENDIAN__ 199 #define splat_laneq_bf16(__p0, __p1) __extension__ ({ \ 200 bfloat16x4_t __ret; \ 201 bfloat16x8_t __s0 = __p0; \ 202 __ret = (bfloat16x4_t) __builtin_neon_splat_laneq_bf16((int8x16_t)__s0, __p1, 43); \ 203 __ret; \ 204 }) 205 #else 206 #define splat_laneq_bf16(__p0, __p1) __extension__ ({ \ 207 bfloat16x4_t __ret; \ 208 bfloat16x8_t __s0 = __p0; \ 209 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 210 __ret = (bfloat16x4_t) __builtin_neon_splat_laneq_bf16((int8x16_t)__rev0, __p1, 43); \ 211 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 212 __ret; \ 213 }) 214 #define __noswap_splat_laneq_bf16(__p0, __p1) __extension__ ({ \ 215 bfloat16x4_t __ret; \ 216 bfloat16x8_t __s0 = __p0; \ 217 __ret = (bfloat16x4_t) __builtin_neon_splat_laneq_bf16((int8x16_t)__s0, __p1, 43); \ 218 __ret; \ 219 }) 220 #endif 221 222 #ifdef 
__LITTLE_ENDIAN__ 223 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfdotq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 224 float32x4_t __ret; 225 __ret = (float32x4_t) __builtin_neon_vbfdotq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 226 return __ret; 227 } 228 #else 229 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfdotq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 230 float32x4_t __ret; 231 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 232 bfloat16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 233 bfloat16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 234 __ret = (float32x4_t) __builtin_neon_vbfdotq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 235 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 236 return __ret; 237 } 238 __ai __attribute__((target("bf16,neon"))) float32x4_t __noswap_vbfdotq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 239 float32x4_t __ret; 240 __ret = (float32x4_t) __builtin_neon_vbfdotq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 241 return __ret; 242 } 243 #endif 244 245 #ifdef __LITTLE_ENDIAN__ 246 __ai __attribute__((target("bf16,neon"))) float32x2_t vbfdot_f32(float32x2_t __p0, bfloat16x4_t __p1, bfloat16x4_t __p2) { 247 float32x2_t __ret; 248 __ret = (float32x2_t) __builtin_neon_vbfdot_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 249 return __ret; 250 } 251 #else 252 __ai __attribute__((target("bf16,neon"))) float32x2_t vbfdot_f32(float32x2_t __p0, bfloat16x4_t __p1, bfloat16x4_t __p2) { 253 float32x2_t __ret; 254 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 255 bfloat16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 256 bfloat16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 257 __ret = (float32x2_t) 
__builtin_neon_vbfdot_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 258 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 259 return __ret; 260 } 261 __ai __attribute__((target("bf16,neon"))) float32x2_t __noswap_vbfdot_f32(float32x2_t __p0, bfloat16x4_t __p1, bfloat16x4_t __p2) { 262 float32x2_t __ret; 263 __ret = (float32x2_t) __builtin_neon_vbfdot_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 264 return __ret; 265 } 266 #endif 267 268 #ifdef __LITTLE_ENDIAN__ 269 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmlalbq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 270 float32x4_t __ret; 271 __ret = (float32x4_t) __builtin_neon_vbfmlalbq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 272 return __ret; 273 } 274 #else 275 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmlalbq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 276 float32x4_t __ret; 277 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 278 bfloat16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 279 bfloat16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 280 __ret = (float32x4_t) __builtin_neon_vbfmlalbq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 281 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 282 return __ret; 283 } 284 __ai __attribute__((target("bf16,neon"))) float32x4_t __noswap_vbfmlalbq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 285 float32x4_t __ret; 286 __ret = (float32x4_t) __builtin_neon_vbfmlalbq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 287 return __ret; 288 } 289 #endif 290 291 #ifdef __LITTLE_ENDIAN__ 292 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmlaltq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 293 float32x4_t __ret; 294 __ret = (float32x4_t) __builtin_neon_vbfmlaltq_f32((int8x16_t)__p0, 
(int8x16_t)__p1, (int8x16_t)__p2, 41); 295 return __ret; 296 } 297 #else 298 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmlaltq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 299 float32x4_t __ret; 300 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 301 bfloat16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 302 bfloat16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 303 __ret = (float32x4_t) __builtin_neon_vbfmlaltq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 304 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 305 return __ret; 306 } 307 __ai __attribute__((target("bf16,neon"))) float32x4_t __noswap_vbfmlaltq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 308 float32x4_t __ret; 309 __ret = (float32x4_t) __builtin_neon_vbfmlaltq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 310 return __ret; 311 } 312 #endif 313 314 #ifdef __LITTLE_ENDIAN__ 315 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmmlaq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 316 float32x4_t __ret; 317 __ret = (float32x4_t) __builtin_neon_vbfmmlaq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 318 return __ret; 319 } 320 #else 321 __ai __attribute__((target("bf16,neon"))) float32x4_t vbfmmlaq_f32(float32x4_t __p0, bfloat16x8_t __p1, bfloat16x8_t __p2) { 322 float32x4_t __ret; 323 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 324 bfloat16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 325 bfloat16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 326 __ret = (float32x4_t) __builtin_neon_vbfmmlaq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 327 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 328 return __ret; 329 } 330 #endif 331 332 #ifdef 
__LITTLE_ENDIAN__ 333 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcombine_bf16(bfloat16x4_t __p0, bfloat16x4_t __p1) { 334 bfloat16x8_t __ret; 335 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 336 return __ret; 337 } 338 #else 339 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcombine_bf16(bfloat16x4_t __p0, bfloat16x4_t __p1) { 340 bfloat16x8_t __ret; 341 bfloat16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 342 bfloat16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 343 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7); 344 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 345 return __ret; 346 } 347 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t __noswap_vcombine_bf16(bfloat16x4_t __p0, bfloat16x4_t __p1) { 348 bfloat16x8_t __ret; 349 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 350 return __ret; 351 } 352 #endif 353 354 #define vcreate_bf16(__p0) __extension__ ({ \ 355 bfloat16x4_t __ret; \ 356 uint64_t __promote = __p0; \ 357 __ret = (bfloat16x4_t)(__promote); \ 358 __ret; \ 359 }) 360 __ai __attribute__((target("bf16,neon"))) float32_t vcvtah_f32_bf16(bfloat16_t __p0) { 361 float32_t __ret; 362 __ret = __builtin_bit_cast(float32_t, (uint32_t)(__builtin_bit_cast(uint16_t, __p0)) << 16); 363 return __ret; 364 } 365 __ai __attribute__((target("bf16,neon"))) bfloat16_t vcvth_bf16_f32(float32_t __p0) { 366 bfloat16_t __ret; 367 __ret = (bfloat16_t) __builtin_neon_vcvth_bf16_f32(__p0); 368 return __ret; 369 } 370 #ifdef __LITTLE_ENDIAN__ 371 #define vduph_lane_bf16(__p0, __p1) __extension__ ({ \ 372 bfloat16_t __ret; \ 373 bfloat16x4_t __s0 = __p0; \ 374 __ret = (bfloat16_t) __builtin_neon_vduph_lane_bf16((bfloat16x4_t)__s0, __p1); \ 375 __ret; \ 376 }) 377 #else 378 #define vduph_lane_bf16(__p0, __p1) __extension__ ({ \ 379 bfloat16_t __ret; \ 380 bfloat16x4_t __s0 = __p0; \ 381 bfloat16x4_t __rev0; 
__rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 382 __ret = (bfloat16_t) __builtin_neon_vduph_lane_bf16((bfloat16x4_t)__rev0, __p1); \ 383 __ret; \ 384 }) 385 #endif 386 387 #ifdef __LITTLE_ENDIAN__ 388 #define vdupq_lane_bf16(__p0_0, __p1_0) __extension__ ({ \ 389 bfloat16x8_t __ret_0; \ 390 bfloat16x4_t __s0_0 = __p0_0; \ 391 __ret_0 = splatq_lane_bf16(__s0_0, __p1_0); \ 392 __ret_0; \ 393 }) 394 #else 395 #define vdupq_lane_bf16(__p0_1, __p1_1) __extension__ ({ \ 396 bfloat16x8_t __ret_1; \ 397 bfloat16x4_t __s0_1 = __p0_1; \ 398 bfloat16x4_t __rev0_1; __rev0_1 = __builtin_shufflevector(__s0_1, __s0_1, 3, 2, 1, 0); \ 399 __ret_1 = __noswap_splatq_lane_bf16(__rev0_1, __p1_1); \ 400 __ret_1 = __builtin_shufflevector(__ret_1, __ret_1, 7, 6, 5, 4, 3, 2, 1, 0); \ 401 __ret_1; \ 402 }) 403 #endif 404 405 #ifdef __LITTLE_ENDIAN__ 406 #define vdup_lane_bf16(__p0_2, __p1_2) __extension__ ({ \ 407 bfloat16x4_t __ret_2; \ 408 bfloat16x4_t __s0_2 = __p0_2; \ 409 __ret_2 = splat_lane_bf16(__s0_2, __p1_2); \ 410 __ret_2; \ 411 }) 412 #else 413 #define vdup_lane_bf16(__p0_3, __p1_3) __extension__ ({ \ 414 bfloat16x4_t __ret_3; \ 415 bfloat16x4_t __s0_3 = __p0_3; \ 416 bfloat16x4_t __rev0_3; __rev0_3 = __builtin_shufflevector(__s0_3, __s0_3, 3, 2, 1, 0); \ 417 __ret_3 = __noswap_splat_lane_bf16(__rev0_3, __p1_3); \ 418 __ret_3 = __builtin_shufflevector(__ret_3, __ret_3, 3, 2, 1, 0); \ 419 __ret_3; \ 420 }) 421 #endif 422 423 #ifdef __LITTLE_ENDIAN__ 424 #define vduph_laneq_bf16(__p0, __p1) __extension__ ({ \ 425 bfloat16_t __ret; \ 426 bfloat16x8_t __s0 = __p0; \ 427 __ret = (bfloat16_t) __builtin_neon_vduph_laneq_bf16((bfloat16x8_t)__s0, __p1); \ 428 __ret; \ 429 }) 430 #else 431 #define vduph_laneq_bf16(__p0, __p1) __extension__ ({ \ 432 bfloat16_t __ret; \ 433 bfloat16x8_t __s0 = __p0; \ 434 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 435 __ret = (bfloat16_t) __builtin_neon_vduph_laneq_bf16((bfloat16x8_t)__rev0, 
__p1); \ 436 __ret; \ 437 }) 438 #endif 439 440 #ifdef __LITTLE_ENDIAN__ 441 #define vdupq_laneq_bf16(__p0_4, __p1_4) __extension__ ({ \ 442 bfloat16x8_t __ret_4; \ 443 bfloat16x8_t __s0_4 = __p0_4; \ 444 __ret_4 = splatq_laneq_bf16(__s0_4, __p1_4); \ 445 __ret_4; \ 446 }) 447 #else 448 #define vdupq_laneq_bf16(__p0_5, __p1_5) __extension__ ({ \ 449 bfloat16x8_t __ret_5; \ 450 bfloat16x8_t __s0_5 = __p0_5; \ 451 bfloat16x8_t __rev0_5; __rev0_5 = __builtin_shufflevector(__s0_5, __s0_5, 7, 6, 5, 4, 3, 2, 1, 0); \ 452 __ret_5 = __noswap_splatq_laneq_bf16(__rev0_5, __p1_5); \ 453 __ret_5 = __builtin_shufflevector(__ret_5, __ret_5, 7, 6, 5, 4, 3, 2, 1, 0); \ 454 __ret_5; \ 455 }) 456 #endif 457 458 #ifdef __LITTLE_ENDIAN__ 459 #define vdup_laneq_bf16(__p0_6, __p1_6) __extension__ ({ \ 460 bfloat16x4_t __ret_6; \ 461 bfloat16x8_t __s0_6 = __p0_6; \ 462 __ret_6 = splat_laneq_bf16(__s0_6, __p1_6); \ 463 __ret_6; \ 464 }) 465 #else 466 #define vdup_laneq_bf16(__p0_7, __p1_7) __extension__ ({ \ 467 bfloat16x4_t __ret_7; \ 468 bfloat16x8_t __s0_7 = __p0_7; \ 469 bfloat16x8_t __rev0_7; __rev0_7 = __builtin_shufflevector(__s0_7, __s0_7, 7, 6, 5, 4, 3, 2, 1, 0); \ 470 __ret_7 = __noswap_splat_laneq_bf16(__rev0_7, __p1_7); \ 471 __ret_7 = __builtin_shufflevector(__ret_7, __ret_7, 3, 2, 1, 0); \ 472 __ret_7; \ 473 }) 474 #endif 475 476 #ifdef __LITTLE_ENDIAN__ 477 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vdupq_n_bf16(bfloat16_t __p0) { 478 bfloat16x8_t __ret; 479 __ret = (bfloat16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 480 return __ret; 481 } 482 #else 483 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vdupq_n_bf16(bfloat16_t __p0) { 484 bfloat16x8_t __ret; 485 __ret = (bfloat16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 486 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 487 return __ret; 488 } 489 #endif 490 491 #ifdef __LITTLE_ENDIAN__ 492 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t 
vdup_n_bf16(bfloat16_t __p0) { 493 bfloat16x4_t __ret; 494 __ret = (bfloat16x4_t) {__p0, __p0, __p0, __p0}; 495 return __ret; 496 } 497 #else 498 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vdup_n_bf16(bfloat16_t __p0) { 499 bfloat16x4_t __ret; 500 __ret = (bfloat16x4_t) {__p0, __p0, __p0, __p0}; 501 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 502 return __ret; 503 } 504 #endif 505 506 #ifdef __LITTLE_ENDIAN__ 507 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vget_high_bf16(bfloat16x8_t __p0) { 508 bfloat16x4_t __ret; 509 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 510 return __ret; 511 } 512 #else 513 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vget_high_bf16(bfloat16x8_t __p0) { 514 bfloat16x4_t __ret; 515 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 516 __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7); 517 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 518 return __ret; 519 } 520 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __noswap_vget_high_bf16(bfloat16x8_t __p0) { 521 bfloat16x4_t __ret; 522 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 523 return __ret; 524 } 525 #endif 526 527 #ifdef __LITTLE_ENDIAN__ 528 #define vgetq_lane_bf16(__p0, __p1) __extension__ ({ \ 529 bfloat16_t __ret; \ 530 bfloat16x8_t __s0 = __p0; \ 531 __ret = (bfloat16_t) __builtin_neon_vgetq_lane_bf16((bfloat16x8_t)__s0, __p1); \ 532 __ret; \ 533 }) 534 #else 535 #define vgetq_lane_bf16(__p0, __p1) __extension__ ({ \ 536 bfloat16_t __ret; \ 537 bfloat16x8_t __s0 = __p0; \ 538 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 539 __ret = (bfloat16_t) __builtin_neon_vgetq_lane_bf16((bfloat16x8_t)__rev0, __p1); \ 540 __ret; \ 541 }) 542 #define __noswap_vgetq_lane_bf16(__p0, __p1) __extension__ ({ \ 543 bfloat16_t __ret; \ 544 bfloat16x8_t __s0 = __p0; \ 545 __ret = (bfloat16_t) 
__builtin_neon_vgetq_lane_bf16((bfloat16x8_t)__s0, __p1); \ 546 __ret; \ 547 }) 548 #endif 549 550 #ifdef __LITTLE_ENDIAN__ 551 #define vget_lane_bf16(__p0, __p1) __extension__ ({ \ 552 bfloat16_t __ret; \ 553 bfloat16x4_t __s0 = __p0; \ 554 __ret = (bfloat16_t) __builtin_neon_vget_lane_bf16((bfloat16x4_t)__s0, __p1); \ 555 __ret; \ 556 }) 557 #else 558 #define vget_lane_bf16(__p0, __p1) __extension__ ({ \ 559 bfloat16_t __ret; \ 560 bfloat16x4_t __s0 = __p0; \ 561 bfloat16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 562 __ret = (bfloat16_t) __builtin_neon_vget_lane_bf16((bfloat16x4_t)__rev0, __p1); \ 563 __ret; \ 564 }) 565 #define __noswap_vget_lane_bf16(__p0, __p1) __extension__ ({ \ 566 bfloat16_t __ret; \ 567 bfloat16x4_t __s0 = __p0; \ 568 __ret = (bfloat16_t) __builtin_neon_vget_lane_bf16((bfloat16x4_t)__s0, __p1); \ 569 __ret; \ 570 }) 571 #endif 572 573 #ifdef __LITTLE_ENDIAN__ 574 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vget_low_bf16(bfloat16x8_t __p0) { 575 bfloat16x4_t __ret; 576 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3); 577 return __ret; 578 } 579 #else 580 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vget_low_bf16(bfloat16x8_t __p0) { 581 bfloat16x4_t __ret; 582 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 583 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3); 584 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 585 return __ret; 586 } 587 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __noswap_vget_low_bf16(bfloat16x8_t __p0) { 588 bfloat16x4_t __ret; 589 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3); 590 return __ret; 591 } 592 #endif 593 594 #ifdef __LITTLE_ENDIAN__ 595 #define vld1q_bf16(__p0) __extension__ ({ \ 596 bfloat16x8_t __ret; \ 597 __ret = (bfloat16x8_t) __builtin_neon_vld1q_bf16(__p0, 43); \ 598 __ret; \ 599 }) 600 #else 601 #define vld1q_bf16(__p0) __extension__ ({ \ 602 bfloat16x8_t 
__ret; \ 603 __ret = (bfloat16x8_t) __builtin_neon_vld1q_bf16(__p0, 43); \ 604 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 605 __ret; \ 606 }) 607 #endif 608 609 #ifdef __LITTLE_ENDIAN__ 610 #define vld1_bf16(__p0) __extension__ ({ \ 611 bfloat16x4_t __ret; \ 612 __ret = (bfloat16x4_t) __builtin_neon_vld1_bf16(__p0, 11); \ 613 __ret; \ 614 }) 615 #else 616 #define vld1_bf16(__p0) __extension__ ({ \ 617 bfloat16x4_t __ret; \ 618 __ret = (bfloat16x4_t) __builtin_neon_vld1_bf16(__p0, 11); \ 619 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 620 __ret; \ 621 }) 622 #endif 623 624 #ifdef __LITTLE_ENDIAN__ 625 #define vld1q_dup_bf16(__p0) __extension__ ({ \ 626 bfloat16x8_t __ret; \ 627 __ret = (bfloat16x8_t) __builtin_neon_vld1q_dup_bf16(__p0, 43); \ 628 __ret; \ 629 }) 630 #else 631 #define vld1q_dup_bf16(__p0) __extension__ ({ \ 632 bfloat16x8_t __ret; \ 633 __ret = (bfloat16x8_t) __builtin_neon_vld1q_dup_bf16(__p0, 43); \ 634 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 635 __ret; \ 636 }) 637 #endif 638 639 #ifdef __LITTLE_ENDIAN__ 640 #define vld1_dup_bf16(__p0) __extension__ ({ \ 641 bfloat16x4_t __ret; \ 642 __ret = (bfloat16x4_t) __builtin_neon_vld1_dup_bf16(__p0, 11); \ 643 __ret; \ 644 }) 645 #else 646 #define vld1_dup_bf16(__p0) __extension__ ({ \ 647 bfloat16x4_t __ret; \ 648 __ret = (bfloat16x4_t) __builtin_neon_vld1_dup_bf16(__p0, 11); \ 649 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 650 __ret; \ 651 }) 652 #endif 653 654 #ifdef __LITTLE_ENDIAN__ 655 #define vld1q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 656 bfloat16x8_t __ret; \ 657 bfloat16x8_t __s1 = __p1; \ 658 __ret = (bfloat16x8_t) __builtin_neon_vld1q_lane_bf16(__p0, (int8x16_t)__s1, __p2, 43); \ 659 __ret; \ 660 }) 661 #else 662 #define vld1q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 663 bfloat16x8_t __ret; \ 664 bfloat16x8_t __s1 = __p1; \ 665 bfloat16x8_t __rev1; __rev1 = 
__builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 666 __ret = (bfloat16x8_t) __builtin_neon_vld1q_lane_bf16(__p0, (int8x16_t)__rev1, __p2, 43); \ 667 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 668 __ret; \ 669 }) 670 #endif 671 672 #ifdef __LITTLE_ENDIAN__ 673 #define vld1_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 674 bfloat16x4_t __ret; \ 675 bfloat16x4_t __s1 = __p1; \ 676 __ret = (bfloat16x4_t) __builtin_neon_vld1_lane_bf16(__p0, (int8x8_t)__s1, __p2, 11); \ 677 __ret; \ 678 }) 679 #else 680 #define vld1_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 681 bfloat16x4_t __ret; \ 682 bfloat16x4_t __s1 = __p1; \ 683 bfloat16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 684 __ret = (bfloat16x4_t) __builtin_neon_vld1_lane_bf16(__p0, (int8x8_t)__rev1, __p2, 11); \ 685 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 686 __ret; \ 687 }) 688 #endif 689 690 #ifdef __LITTLE_ENDIAN__ 691 #define vld1q_bf16_x2(__p0) __extension__ ({ \ 692 bfloat16x8x2_t __ret; \ 693 __builtin_neon_vld1q_bf16_x2(&__ret, __p0, 43); \ 694 __ret; \ 695 }) 696 #else 697 #define vld1q_bf16_x2(__p0) __extension__ ({ \ 698 bfloat16x8x2_t __ret; \ 699 __builtin_neon_vld1q_bf16_x2(&__ret, __p0, 43); \ 700 \ 701 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 702 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 703 __ret; \ 704 }) 705 #endif 706 707 #ifdef __LITTLE_ENDIAN__ 708 #define vld1_bf16_x2(__p0) __extension__ ({ \ 709 bfloat16x4x2_t __ret; \ 710 __builtin_neon_vld1_bf16_x2(&__ret, __p0, 11); \ 711 __ret; \ 712 }) 713 #else 714 #define vld1_bf16_x2(__p0) __extension__ ({ \ 715 bfloat16x4x2_t __ret; \ 716 __builtin_neon_vld1_bf16_x2(&__ret, __p0, 11); \ 717 \ 718 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 719 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 
0); \ 720 __ret; \ 721 }) 722 #endif 723 724 #ifdef __LITTLE_ENDIAN__ 725 #define vld1q_bf16_x3(__p0) __extension__ ({ \ 726 bfloat16x8x3_t __ret; \ 727 __builtin_neon_vld1q_bf16_x3(&__ret, __p0, 43); \ 728 __ret; \ 729 }) 730 #else 731 #define vld1q_bf16_x3(__p0) __extension__ ({ \ 732 bfloat16x8x3_t __ret; \ 733 __builtin_neon_vld1q_bf16_x3(&__ret, __p0, 43); \ 734 \ 735 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 736 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 737 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 738 __ret; \ 739 }) 740 #endif 741 742 #ifdef __LITTLE_ENDIAN__ 743 #define vld1_bf16_x3(__p0) __extension__ ({ \ 744 bfloat16x4x3_t __ret; \ 745 __builtin_neon_vld1_bf16_x3(&__ret, __p0, 11); \ 746 __ret; \ 747 }) 748 #else 749 #define vld1_bf16_x3(__p0) __extension__ ({ \ 750 bfloat16x4x3_t __ret; \ 751 __builtin_neon_vld1_bf16_x3(&__ret, __p0, 11); \ 752 \ 753 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 754 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 755 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 756 __ret; \ 757 }) 758 #endif 759 760 #ifdef __LITTLE_ENDIAN__ 761 #define vld1q_bf16_x4(__p0) __extension__ ({ \ 762 bfloat16x8x4_t __ret; \ 763 __builtin_neon_vld1q_bf16_x4(&__ret, __p0, 43); \ 764 __ret; \ 765 }) 766 #else 767 #define vld1q_bf16_x4(__p0) __extension__ ({ \ 768 bfloat16x8x4_t __ret; \ 769 __builtin_neon_vld1q_bf16_x4(&__ret, __p0, 43); \ 770 \ 771 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 772 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 773 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 774 __ret.val[3] = 
__builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 775 __ret; \ 776 }) 777 #endif 778 779 #ifdef __LITTLE_ENDIAN__ 780 #define vld1_bf16_x4(__p0) __extension__ ({ \ 781 bfloat16x4x4_t __ret; \ 782 __builtin_neon_vld1_bf16_x4(&__ret, __p0, 11); \ 783 __ret; \ 784 }) 785 #else 786 #define vld1_bf16_x4(__p0) __extension__ ({ \ 787 bfloat16x4x4_t __ret; \ 788 __builtin_neon_vld1_bf16_x4(&__ret, __p0, 11); \ 789 \ 790 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 791 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 792 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 793 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 794 __ret; \ 795 }) 796 #endif 797 798 #ifdef __LITTLE_ENDIAN__ 799 #define vld2q_bf16(__p0) __extension__ ({ \ 800 bfloat16x8x2_t __ret; \ 801 __builtin_neon_vld2q_bf16(&__ret, __p0, 43); \ 802 __ret; \ 803 }) 804 #else 805 #define vld2q_bf16(__p0) __extension__ ({ \ 806 bfloat16x8x2_t __ret; \ 807 __builtin_neon_vld2q_bf16(&__ret, __p0, 43); \ 808 \ 809 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 810 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 811 __ret; \ 812 }) 813 #endif 814 815 #ifdef __LITTLE_ENDIAN__ 816 #define vld2_bf16(__p0) __extension__ ({ \ 817 bfloat16x4x2_t __ret; \ 818 __builtin_neon_vld2_bf16(&__ret, __p0, 11); \ 819 __ret; \ 820 }) 821 #else 822 #define vld2_bf16(__p0) __extension__ ({ \ 823 bfloat16x4x2_t __ret; \ 824 __builtin_neon_vld2_bf16(&__ret, __p0, 11); \ 825 \ 826 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 827 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 828 __ret; \ 829 }) 830 #endif 831 832 #ifdef __LITTLE_ENDIAN__ 833 #define vld2q_dup_bf16(__p0) __extension__ ({ \ 834 bfloat16x8x2_t __ret; 
\ 835 __builtin_neon_vld2q_dup_bf16(&__ret, __p0, 43); \ 836 __ret; \ 837 }) 838 #else 839 #define vld2q_dup_bf16(__p0) __extension__ ({ \ 840 bfloat16x8x2_t __ret; \ 841 __builtin_neon_vld2q_dup_bf16(&__ret, __p0, 43); \ 842 \ 843 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 844 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 845 __ret; \ 846 }) 847 #endif 848 849 #ifdef __LITTLE_ENDIAN__ 850 #define vld2_dup_bf16(__p0) __extension__ ({ \ 851 bfloat16x4x2_t __ret; \ 852 __builtin_neon_vld2_dup_bf16(&__ret, __p0, 11); \ 853 __ret; \ 854 }) 855 #else 856 #define vld2_dup_bf16(__p0) __extension__ ({ \ 857 bfloat16x4x2_t __ret; \ 858 __builtin_neon_vld2_dup_bf16(&__ret, __p0, 11); \ 859 \ 860 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 861 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 862 __ret; \ 863 }) 864 #endif 865 866 #ifdef __LITTLE_ENDIAN__ 867 #define vld2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 868 bfloat16x8x2_t __ret; \ 869 bfloat16x8x2_t __s1 = __p1; \ 870 __builtin_neon_vld2q_lane_bf16(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 43); \ 871 __ret; \ 872 }) 873 #else 874 #define vld2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 875 bfloat16x8x2_t __ret; \ 876 bfloat16x8x2_t __s1 = __p1; \ 877 bfloat16x8x2_t __rev1; \ 878 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 879 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 880 __builtin_neon_vld2q_lane_bf16(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 43); \ 881 \ 882 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 883 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 884 __ret; \ 885 }) 886 #endif 887 888 
#ifdef __LITTLE_ENDIAN__ 889 #define vld2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 890 bfloat16x4x2_t __ret; \ 891 bfloat16x4x2_t __s1 = __p1; \ 892 __builtin_neon_vld2_lane_bf16(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 11); \ 893 __ret; \ 894 }) 895 #else 896 #define vld2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 897 bfloat16x4x2_t __ret; \ 898 bfloat16x4x2_t __s1 = __p1; \ 899 bfloat16x4x2_t __rev1; \ 900 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 901 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 902 __builtin_neon_vld2_lane_bf16(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 11); \ 903 \ 904 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 905 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 906 __ret; \ 907 }) 908 #endif 909 910 #ifdef __LITTLE_ENDIAN__ 911 #define vld3q_bf16(__p0) __extension__ ({ \ 912 bfloat16x8x3_t __ret; \ 913 __builtin_neon_vld3q_bf16(&__ret, __p0, 43); \ 914 __ret; \ 915 }) 916 #else 917 #define vld3q_bf16(__p0) __extension__ ({ \ 918 bfloat16x8x3_t __ret; \ 919 __builtin_neon_vld3q_bf16(&__ret, __p0, 43); \ 920 \ 921 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 922 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 923 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 924 __ret; \ 925 }) 926 #endif 927 928 #ifdef __LITTLE_ENDIAN__ 929 #define vld3_bf16(__p0) __extension__ ({ \ 930 bfloat16x4x3_t __ret; \ 931 __builtin_neon_vld3_bf16(&__ret, __p0, 11); \ 932 __ret; \ 933 }) 934 #else 935 #define vld3_bf16(__p0) __extension__ ({ \ 936 bfloat16x4x3_t __ret; \ 937 __builtin_neon_vld3_bf16(&__ret, __p0, 11); \ 938 \ 939 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 940 
__ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 941 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 942 __ret; \ 943 }) 944 #endif 945 946 #ifdef __LITTLE_ENDIAN__ 947 #define vld3q_dup_bf16(__p0) __extension__ ({ \ 948 bfloat16x8x3_t __ret; \ 949 __builtin_neon_vld3q_dup_bf16(&__ret, __p0, 43); \ 950 __ret; \ 951 }) 952 #else 953 #define vld3q_dup_bf16(__p0) __extension__ ({ \ 954 bfloat16x8x3_t __ret; \ 955 __builtin_neon_vld3q_dup_bf16(&__ret, __p0, 43); \ 956 \ 957 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 958 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 959 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 960 __ret; \ 961 }) 962 #endif 963 964 #ifdef __LITTLE_ENDIAN__ 965 #define vld3_dup_bf16(__p0) __extension__ ({ \ 966 bfloat16x4x3_t __ret; \ 967 __builtin_neon_vld3_dup_bf16(&__ret, __p0, 11); \ 968 __ret; \ 969 }) 970 #else 971 #define vld3_dup_bf16(__p0) __extension__ ({ \ 972 bfloat16x4x3_t __ret; \ 973 __builtin_neon_vld3_dup_bf16(&__ret, __p0, 11); \ 974 \ 975 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 976 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 977 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 978 __ret; \ 979 }) 980 #endif 981 982 #ifdef __LITTLE_ENDIAN__ 983 #define vld3q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 984 bfloat16x8x3_t __ret; \ 985 bfloat16x8x3_t __s1 = __p1; \ 986 __builtin_neon_vld3q_lane_bf16(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 43); \ 987 __ret; \ 988 }) 989 #else 990 #define vld3q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 991 bfloat16x8x3_t __ret; \ 992 bfloat16x8x3_t __s1 = __p1; \ 993 bfloat16x8x3_t __rev1; \ 994 __rev1.val[0] = 
__builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 995 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 996 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 997 __builtin_neon_vld3q_lane_bf16(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 43); \ 998 \ 999 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1000 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1001 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1002 __ret; \ 1003 }) 1004 #endif 1005 1006 #ifdef __LITTLE_ENDIAN__ 1007 #define vld3_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1008 bfloat16x4x3_t __ret; \ 1009 bfloat16x4x3_t __s1 = __p1; \ 1010 __builtin_neon_vld3_lane_bf16(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 11); \ 1011 __ret; \ 1012 }) 1013 #else 1014 #define vld3_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1015 bfloat16x4x3_t __ret; \ 1016 bfloat16x4x3_t __s1 = __p1; \ 1017 bfloat16x4x3_t __rev1; \ 1018 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1019 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1020 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 1021 __builtin_neon_vld3_lane_bf16(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 11); \ 1022 \ 1023 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 1024 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 1025 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 1026 __ret; \ 1027 }) 1028 #endif 1029 1030 #ifdef __LITTLE_ENDIAN__ 1031 #define vld4q_bf16(__p0) 
__extension__ ({ \ 1032 bfloat16x8x4_t __ret; \ 1033 __builtin_neon_vld4q_bf16(&__ret, __p0, 43); \ 1034 __ret; \ 1035 }) 1036 #else 1037 #define vld4q_bf16(__p0) __extension__ ({ \ 1038 bfloat16x8x4_t __ret; \ 1039 __builtin_neon_vld4q_bf16(&__ret, __p0, 43); \ 1040 \ 1041 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1042 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1043 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1044 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 1045 __ret; \ 1046 }) 1047 #endif 1048 1049 #ifdef __LITTLE_ENDIAN__ 1050 #define vld4_bf16(__p0) __extension__ ({ \ 1051 bfloat16x4x4_t __ret; \ 1052 __builtin_neon_vld4_bf16(&__ret, __p0, 11); \ 1053 __ret; \ 1054 }) 1055 #else 1056 #define vld4_bf16(__p0) __extension__ ({ \ 1057 bfloat16x4x4_t __ret; \ 1058 __builtin_neon_vld4_bf16(&__ret, __p0, 11); \ 1059 \ 1060 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 1061 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 1062 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 1063 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 1064 __ret; \ 1065 }) 1066 #endif 1067 1068 #ifdef __LITTLE_ENDIAN__ 1069 #define vld4q_dup_bf16(__p0) __extension__ ({ \ 1070 bfloat16x8x4_t __ret; \ 1071 __builtin_neon_vld4q_dup_bf16(&__ret, __p0, 43); \ 1072 __ret; \ 1073 }) 1074 #else 1075 #define vld4q_dup_bf16(__p0) __extension__ ({ \ 1076 bfloat16x8x4_t __ret; \ 1077 __builtin_neon_vld4q_dup_bf16(&__ret, __p0, 43); \ 1078 \ 1079 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1080 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1081 __ret.val[2] = 
__builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1082 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 1083 __ret; \ 1084 }) 1085 #endif 1086 1087 #ifdef __LITTLE_ENDIAN__ 1088 #define vld4_dup_bf16(__p0) __extension__ ({ \ 1089 bfloat16x4x4_t __ret; \ 1090 __builtin_neon_vld4_dup_bf16(&__ret, __p0, 11); \ 1091 __ret; \ 1092 }) 1093 #else 1094 #define vld4_dup_bf16(__p0) __extension__ ({ \ 1095 bfloat16x4x4_t __ret; \ 1096 __builtin_neon_vld4_dup_bf16(&__ret, __p0, 11); \ 1097 \ 1098 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 1099 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 1100 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 1101 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 1102 __ret; \ 1103 }) 1104 #endif 1105 1106 #ifdef __LITTLE_ENDIAN__ 1107 #define vld4q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1108 bfloat16x8x4_t __ret; \ 1109 bfloat16x8x4_t __s1 = __p1; \ 1110 __builtin_neon_vld4q_lane_bf16(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 43); \ 1111 __ret; \ 1112 }) 1113 #else 1114 #define vld4q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1115 bfloat16x8x4_t __ret; \ 1116 bfloat16x8x4_t __s1 = __p1; \ 1117 bfloat16x8x4_t __rev1; \ 1118 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1119 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1120 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1121 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 1122 __builtin_neon_vld4q_lane_bf16(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 
(int8x16_t)__rev1.val[3], __p2, 43); \ 1123 \ 1124 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1125 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1126 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1127 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 1128 __ret; \ 1129 }) 1130 #endif 1131 1132 #ifdef __LITTLE_ENDIAN__ 1133 #define vld4_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1134 bfloat16x4x4_t __ret; \ 1135 bfloat16x4x4_t __s1 = __p1; \ 1136 __builtin_neon_vld4_lane_bf16(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 11); \ 1137 __ret; \ 1138 }) 1139 #else 1140 #define vld4_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1141 bfloat16x4x4_t __ret; \ 1142 bfloat16x4x4_t __s1 = __p1; \ 1143 bfloat16x4x4_t __rev1; \ 1144 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1145 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1146 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 1147 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 1148 __builtin_neon_vld4_lane_bf16(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 11); \ 1149 \ 1150 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 1151 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 1152 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 1153 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 1154 __ret; \ 1155 }) 1156 #endif 1157 1158 #ifdef __LITTLE_ENDIAN__ 1159 #define vsetq_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1160 bfloat16x8_t 
__ret; \ 1161 bfloat16_t __s0 = __p0; \ 1162 bfloat16x8_t __s1 = __p1; \ 1163 __ret = (bfloat16x8_t) __builtin_neon_vsetq_lane_bf16(__s0, (bfloat16x8_t)__s1, __p2); \ 1164 __ret; \ 1165 }) 1166 #else 1167 #define vsetq_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1168 bfloat16x8_t __ret; \ 1169 bfloat16_t __s0 = __p0; \ 1170 bfloat16x8_t __s1 = __p1; \ 1171 bfloat16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 1172 __ret = (bfloat16x8_t) __builtin_neon_vsetq_lane_bf16(__s0, (bfloat16x8_t)__rev1, __p2); \ 1173 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 1174 __ret; \ 1175 }) 1176 #define __noswap_vsetq_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1177 bfloat16x8_t __ret; \ 1178 bfloat16_t __s0 = __p0; \ 1179 bfloat16x8_t __s1 = __p1; \ 1180 __ret = (bfloat16x8_t) __builtin_neon_vsetq_lane_bf16(__s0, (bfloat16x8_t)__s1, __p2); \ 1181 __ret; \ 1182 }) 1183 #endif 1184 1185 #ifdef __LITTLE_ENDIAN__ 1186 #define vset_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1187 bfloat16x4_t __ret; \ 1188 bfloat16_t __s0 = __p0; \ 1189 bfloat16x4_t __s1 = __p1; \ 1190 __ret = (bfloat16x4_t) __builtin_neon_vset_lane_bf16(__s0, (bfloat16x4_t)__s1, __p2); \ 1191 __ret; \ 1192 }) 1193 #else 1194 #define vset_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1195 bfloat16x4_t __ret; \ 1196 bfloat16_t __s0 = __p0; \ 1197 bfloat16x4_t __s1 = __p1; \ 1198 bfloat16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 1199 __ret = (bfloat16x4_t) __builtin_neon_vset_lane_bf16(__s0, (bfloat16x4_t)__rev1, __p2); \ 1200 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 1201 __ret; \ 1202 }) 1203 #define __noswap_vset_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1204 bfloat16x4_t __ret; \ 1205 bfloat16_t __s0 = __p0; \ 1206 bfloat16x4_t __s1 = __p1; \ 1207 __ret = (bfloat16x4_t) __builtin_neon_vset_lane_bf16(__s0, (bfloat16x4_t)__s1, __p2); \ 1208 __ret; \ 1209 }) 1210 #endif 1211 1212 #ifdef 
__LITTLE_ENDIAN__ 1213 #define vst1q_bf16(__p0, __p1) __extension__ ({ \ 1214 bfloat16x8_t __s1 = __p1; \ 1215 __builtin_neon_vst1q_bf16(__p0, (int8x16_t)__s1, 43); \ 1216 }) 1217 #else 1218 #define vst1q_bf16(__p0, __p1) __extension__ ({ \ 1219 bfloat16x8_t __s1 = __p1; \ 1220 bfloat16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 1221 __builtin_neon_vst1q_bf16(__p0, (int8x16_t)__rev1, 43); \ 1222 }) 1223 #endif 1224 1225 #ifdef __LITTLE_ENDIAN__ 1226 #define vst1_bf16(__p0, __p1) __extension__ ({ \ 1227 bfloat16x4_t __s1 = __p1; \ 1228 __builtin_neon_vst1_bf16(__p0, (int8x8_t)__s1, 11); \ 1229 }) 1230 #else 1231 #define vst1_bf16(__p0, __p1) __extension__ ({ \ 1232 bfloat16x4_t __s1 = __p1; \ 1233 bfloat16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 1234 __builtin_neon_vst1_bf16(__p0, (int8x8_t)__rev1, 11); \ 1235 }) 1236 #endif 1237 1238 #ifdef __LITTLE_ENDIAN__ 1239 #define vst1q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1240 bfloat16x8_t __s1 = __p1; \ 1241 __builtin_neon_vst1q_lane_bf16(__p0, (int8x16_t)__s1, __p2, 43); \ 1242 }) 1243 #else 1244 #define vst1q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1245 bfloat16x8_t __s1 = __p1; \ 1246 bfloat16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 1247 __builtin_neon_vst1q_lane_bf16(__p0, (int8x16_t)__rev1, __p2, 43); \ 1248 }) 1249 #endif 1250 1251 #ifdef __LITTLE_ENDIAN__ 1252 #define vst1_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1253 bfloat16x4_t __s1 = __p1; \ 1254 __builtin_neon_vst1_lane_bf16(__p0, (int8x8_t)__s1, __p2, 11); \ 1255 }) 1256 #else 1257 #define vst1_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1258 bfloat16x4_t __s1 = __p1; \ 1259 bfloat16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 1260 __builtin_neon_vst1_lane_bf16(__p0, (int8x8_t)__rev1, __p2, 11); \ 1261 }) 1262 #endif 1263 1264 #ifdef __LITTLE_ENDIAN__ 1265 #define vst1q_bf16_x2(__p0, __p1) 
__extension__ ({ \ 1266 bfloat16x8x2_t __s1 = __p1; \ 1267 __builtin_neon_vst1q_bf16_x2(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 43); \ 1268 }) 1269 #else 1270 #define vst1q_bf16_x2(__p0, __p1) __extension__ ({ \ 1271 bfloat16x8x2_t __s1 = __p1; \ 1272 bfloat16x8x2_t __rev1; \ 1273 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1274 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1275 __builtin_neon_vst1q_bf16_x2(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 43); \ 1276 }) 1277 #endif 1278 1279 #ifdef __LITTLE_ENDIAN__ 1280 #define vst1_bf16_x2(__p0, __p1) __extension__ ({ \ 1281 bfloat16x4x2_t __s1 = __p1; \ 1282 __builtin_neon_vst1_bf16_x2(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 11); \ 1283 }) 1284 #else 1285 #define vst1_bf16_x2(__p0, __p1) __extension__ ({ \ 1286 bfloat16x4x2_t __s1 = __p1; \ 1287 bfloat16x4x2_t __rev1; \ 1288 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1289 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1290 __builtin_neon_vst1_bf16_x2(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 11); \ 1291 }) 1292 #endif 1293 1294 #ifdef __LITTLE_ENDIAN__ 1295 #define vst1q_bf16_x3(__p0, __p1) __extension__ ({ \ 1296 bfloat16x8x3_t __s1 = __p1; \ 1297 __builtin_neon_vst1q_bf16_x3(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 43); \ 1298 }) 1299 #else 1300 #define vst1q_bf16_x3(__p0, __p1) __extension__ ({ \ 1301 bfloat16x8x3_t __s1 = __p1; \ 1302 bfloat16x8x3_t __rev1; \ 1303 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1304 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1305 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1306 __builtin_neon_vst1q_bf16_x3(__p0, 
(int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 43); \ 1307 }) 1308 #endif 1309 1310 #ifdef __LITTLE_ENDIAN__ 1311 #define vst1_bf16_x3(__p0, __p1) __extension__ ({ \ 1312 bfloat16x4x3_t __s1 = __p1; \ 1313 __builtin_neon_vst1_bf16_x3(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 11); \ 1314 }) 1315 #else 1316 #define vst1_bf16_x3(__p0, __p1) __extension__ ({ \ 1317 bfloat16x4x3_t __s1 = __p1; \ 1318 bfloat16x4x3_t __rev1; \ 1319 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1320 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1321 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 1322 __builtin_neon_vst1_bf16_x3(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 11); \ 1323 }) 1324 #endif 1325 1326 #ifdef __LITTLE_ENDIAN__ 1327 #define vst1q_bf16_x4(__p0, __p1) __extension__ ({ \ 1328 bfloat16x8x4_t __s1 = __p1; \ 1329 __builtin_neon_vst1q_bf16_x4(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 43); \ 1330 }) 1331 #else 1332 #define vst1q_bf16_x4(__p0, __p1) __extension__ ({ \ 1333 bfloat16x8x4_t __s1 = __p1; \ 1334 bfloat16x8x4_t __rev1; \ 1335 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1336 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1337 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1338 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 1339 __builtin_neon_vst1q_bf16_x4(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 43); \ 1340 }) 1341 #endif 1342 1343 #ifdef __LITTLE_ENDIAN__ 1344 #define vst1_bf16_x4(__p0, __p1) __extension__ ({ \ 1345 bfloat16x4x4_t __s1 = __p1; \ 1346 
__builtin_neon_vst1_bf16_x4(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 11); \ 1347 }) 1348 #else 1349 #define vst1_bf16_x4(__p0, __p1) __extension__ ({ \ 1350 bfloat16x4x4_t __s1 = __p1; \ 1351 bfloat16x4x4_t __rev1; \ 1352 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1353 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1354 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 1355 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 1356 __builtin_neon_vst1_bf16_x4(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 11); \ 1357 }) 1358 #endif 1359 1360 #ifdef __LITTLE_ENDIAN__ 1361 #define vst2q_bf16(__p0, __p1) __extension__ ({ \ 1362 bfloat16x8x2_t __s1 = __p1; \ 1363 __builtin_neon_vst2q_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 43); \ 1364 }) 1365 #else 1366 #define vst2q_bf16(__p0, __p1) __extension__ ({ \ 1367 bfloat16x8x2_t __s1 = __p1; \ 1368 bfloat16x8x2_t __rev1; \ 1369 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1370 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1371 __builtin_neon_vst2q_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 43); \ 1372 }) 1373 #endif 1374 1375 #ifdef __LITTLE_ENDIAN__ 1376 #define vst2_bf16(__p0, __p1) __extension__ ({ \ 1377 bfloat16x4x2_t __s1 = __p1; \ 1378 __builtin_neon_vst2_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 11); \ 1379 }) 1380 #else 1381 #define vst2_bf16(__p0, __p1) __extension__ ({ \ 1382 bfloat16x4x2_t __s1 = __p1; \ 1383 bfloat16x4x2_t __rev1; \ 1384 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1385 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1386 
__builtin_neon_vst2_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 11); \ 1387 }) 1388 #endif 1389 1390 #ifdef __LITTLE_ENDIAN__ 1391 #define vst2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1392 bfloat16x8x2_t __s1 = __p1; \ 1393 __builtin_neon_vst2q_lane_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 43); \ 1394 }) 1395 #else 1396 #define vst2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1397 bfloat16x8x2_t __s1 = __p1; \ 1398 bfloat16x8x2_t __rev1; \ 1399 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1400 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1401 __builtin_neon_vst2q_lane_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 43); \ 1402 }) 1403 #endif 1404 1405 #ifdef __LITTLE_ENDIAN__ 1406 #define vst2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1407 bfloat16x4x2_t __s1 = __p1; \ 1408 __builtin_neon_vst2_lane_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 11); \ 1409 }) 1410 #else 1411 #define vst2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1412 bfloat16x4x2_t __s1 = __p1; \ 1413 bfloat16x4x2_t __rev1; \ 1414 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1415 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1416 __builtin_neon_vst2_lane_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 11); \ 1417 }) 1418 #endif 1419 1420 #ifdef __LITTLE_ENDIAN__ 1421 #define vst3q_bf16(__p0, __p1) __extension__ ({ \ 1422 bfloat16x8x3_t __s1 = __p1; \ 1423 __builtin_neon_vst3q_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 43); \ 1424 }) 1425 #else 1426 #define vst3q_bf16(__p0, __p1) __extension__ ({ \ 1427 bfloat16x8x3_t __s1 = __p1; \ 1428 bfloat16x8x3_t __rev1; \ 1429 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1430 __rev1.val[1] = 
__builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1431 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1432 __builtin_neon_vst3q_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 43); \ 1433 }) 1434 #endif 1435 1436 #ifdef __LITTLE_ENDIAN__ 1437 #define vst3_bf16(__p0, __p1) __extension__ ({ \ 1438 bfloat16x4x3_t __s1 = __p1; \ 1439 __builtin_neon_vst3_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 11); \ 1440 }) 1441 #else 1442 #define vst3_bf16(__p0, __p1) __extension__ ({ \ 1443 bfloat16x4x3_t __s1 = __p1; \ 1444 bfloat16x4x3_t __rev1; \ 1445 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1446 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1447 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 1448 __builtin_neon_vst3_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 11); \ 1449 }) 1450 #endif 1451 1452 #ifdef __LITTLE_ENDIAN__ 1453 #define vst3q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1454 bfloat16x8x3_t __s1 = __p1; \ 1455 __builtin_neon_vst3q_lane_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 43); \ 1456 }) 1457 #else 1458 #define vst3q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1459 bfloat16x8x3_t __s1 = __p1; \ 1460 bfloat16x8x3_t __rev1; \ 1461 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1462 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1463 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1464 __builtin_neon_vst3q_lane_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 43); \ 1465 }) 1466 #endif 1467 1468 #ifdef __LITTLE_ENDIAN__ 1469 #define 
vst3_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1470 bfloat16x4x3_t __s1 = __p1; \ 1471 __builtin_neon_vst3_lane_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 11); \ 1472 }) 1473 #else 1474 #define vst3_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1475 bfloat16x4x3_t __s1 = __p1; \ 1476 bfloat16x4x3_t __rev1; \ 1477 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1478 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1479 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 1480 __builtin_neon_vst3_lane_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 11); \ 1481 }) 1482 #endif 1483 1484 #ifdef __LITTLE_ENDIAN__ 1485 #define vst4q_bf16(__p0, __p1) __extension__ ({ \ 1486 bfloat16x8x4_t __s1 = __p1; \ 1487 __builtin_neon_vst4q_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 43); \ 1488 }) 1489 #else 1490 #define vst4q_bf16(__p0, __p1) __extension__ ({ \ 1491 bfloat16x8x4_t __s1 = __p1; \ 1492 bfloat16x8x4_t __rev1; \ 1493 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1494 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1495 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1496 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 1497 __builtin_neon_vst4q_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 43); \ 1498 }) 1499 #endif 1500 1501 #ifdef __LITTLE_ENDIAN__ 1502 #define vst4_bf16(__p0, __p1) __extension__ ({ \ 1503 bfloat16x4x4_t __s1 = __p1; \ 1504 __builtin_neon_vst4_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 11); \ 1505 }) 
1506 #else 1507 #define vst4_bf16(__p0, __p1) __extension__ ({ \ 1508 bfloat16x4x4_t __s1 = __p1; \ 1509 bfloat16x4x4_t __rev1; \ 1510 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1511 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1512 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 1513 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 1514 __builtin_neon_vst4_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 11); \ 1515 }) 1516 #endif 1517 1518 #ifdef __LITTLE_ENDIAN__ 1519 #define vst4q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1520 bfloat16x8x4_t __s1 = __p1; \ 1521 __builtin_neon_vst4q_lane_bf16(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 43); \ 1522 }) 1523 #else 1524 #define vst4q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1525 bfloat16x8x4_t __s1 = __p1; \ 1526 bfloat16x8x4_t __rev1; \ 1527 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 1528 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 1529 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 1530 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 1531 __builtin_neon_vst4q_lane_bf16(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 43); \ 1532 }) 1533 #endif 1534 1535 #ifdef __LITTLE_ENDIAN__ 1536 #define vst4_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 1537 bfloat16x4x4_t __s1 = __p1; \ 1538 __builtin_neon_vst4_lane_bf16(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 11); \ 1539 }) 1540 #else 1541 #define vst4_lane_bf16(__p0, __p1, __p2) 
__extension__ ({ \ 1542 bfloat16x4x4_t __s1 = __p1; \ 1543 bfloat16x4x4_t __rev1; \ 1544 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 1545 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 1546 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 1547 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 1548 __builtin_neon_vst4_lane_bf16(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 11); \ 1549 }) 1550 #endif 1551

/*
 * Shape shared by every wrapper in this group:
 *   - when __LITTLE_ENDIAN__ is defined, the operands are handed to the
 *     builtin (or vector operator) as they are;
 *   - otherwise each operand has its lanes reversed with
 *     __builtin_shufflevector first, and the result has its lanes
 *     reversed again before it is returned.
 * The trailing integer literal of each builtin call is passed through
 * unchanged (presumably a type selector for the builtin -- confirm
 * against the generator before touching it).
 */

/* vdotq_u32: wraps __builtin_neon_vdotq_u32 (selector 50). */
__ai __attribute__((target("dotprod,neon"))) uint32x4_t vdotq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
#ifdef __LITTLE_ENDIAN__
  return (uint32x4_t) __builtin_neon_vdotq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
#else
  uint32x4_t __sw0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  uint8x16_t __sw1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  uint8x16_t __sw2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  uint32x4_t __res = (uint32x4_t) __builtin_neon_vdotq_u32((int8x16_t)__sw0, (int8x16_t)__sw1, (int8x16_t)__sw2, 50);
  return __builtin_shufflevector(__res, __res, 3, 2, 1, 0);
#endif
}
#ifndef __LITTLE_ENDIAN__
/* __noswap_vdotq_u32: same builtin call with no lane reversal; only
 * defined when __LITTLE_ENDIAN__ is not. */
__ai __attribute__((target("dotprod,neon"))) uint32x4_t __noswap_vdotq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) {
  return (uint32x4_t) __builtin_neon_vdotq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50);
}
#endif

/* vdotq_s32: wraps __builtin_neon_vdotq_s32 (selector 34). */
__ai __attribute__((target("dotprod,neon"))) int32x4_t vdotq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) {
#ifdef __LITTLE_ENDIAN__
  return (int32x4_t) __builtin_neon_vdotq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
#else
  int32x4_t __sw0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  int8x16_t __sw1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  int8x16_t __sw2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0);
  int32x4_t __res = (int32x4_t) __builtin_neon_vdotq_s32((int8x16_t)__sw0, (int8x16_t)__sw1, (int8x16_t)__sw2, 34);
  return __builtin_shufflevector(__res, __res, 3, 2, 1, 0);
#endif
}
#ifndef __LITTLE_ENDIAN__
/* __noswap_vdotq_s32: same builtin call with no lane reversal. */
__ai __attribute__((target("dotprod,neon"))) int32x4_t __noswap_vdotq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) {
  return (int32x4_t) __builtin_neon_vdotq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34);
}
#endif

/* vdot_u32: wraps __builtin_neon_vdot_u32 (selector 18). */
__ai __attribute__((target("dotprod,neon"))) uint32x2_t vdot_u32(uint32x2_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
#ifdef __LITTLE_ENDIAN__
  return (uint32x2_t) __builtin_neon_vdot_u32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 18);
#else
  uint32x2_t __sw0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  uint8x8_t __sw1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  uint8x8_t __sw2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  uint32x2_t __res = (uint32x2_t) __builtin_neon_vdot_u32((int8x8_t)__sw0, (int8x8_t)__sw1, (int8x8_t)__sw2, 18);
  return __builtin_shufflevector(__res, __res, 1, 0);
#endif
}
#ifndef __LITTLE_ENDIAN__
/* __noswap_vdot_u32: same builtin call with no lane reversal. */
__ai __attribute__((target("dotprod,neon"))) uint32x2_t __noswap_vdot_u32(uint32x2_t __p0, uint8x8_t __p1, uint8x8_t __p2) {
  return (uint32x2_t) __builtin_neon_vdot_u32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 18);
}
#endif

/* vdot_s32: wraps __builtin_neon_vdot_s32 (selector 2). */
__ai __attribute__((target("dotprod,neon"))) int32x2_t vdot_s32(int32x2_t __p0, int8x8_t __p1, int8x8_t __p2) {
#ifdef __LITTLE_ENDIAN__
  return (int32x2_t) __builtin_neon_vdot_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
#else
  int32x2_t __sw0 = __builtin_shufflevector(__p0, __p0, 1, 0);
  int8x8_t __sw1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  int8x8_t __sw2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0);
  int32x2_t __res = (int32x2_t) __builtin_neon_vdot_s32((int8x8_t)__sw0, (int8x8_t)__sw1, (int8x8_t)__sw2, 2);
  return __builtin_shufflevector(__res, __res, 1, 0);
#endif
}
#ifndef __LITTLE_ENDIAN__
/* __noswap_vdot_s32: same builtin call with no lane reversal. */
__ai __attribute__((target("dotprod,neon"))) int32x2_t __noswap_vdot_s32(int32x2_t __p0, int8x8_t __p1, int8x8_t __p2) {
  return (int32x2_t) __builtin_neon_vdot_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2);
}
#endif

/* vabdq_f16: wraps __builtin_neon_vabdq_f16 (selector 40). */
__ai __attribute__((target("fullfp16,neon"))) float16x8_t vabdq_f16(float16x8_t __p0, float16x8_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return (float16x8_t) __builtin_neon_vabdq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40);
#else
  float16x8_t __sw0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  float16x8_t __sw1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  float16x8_t __res = (float16x8_t) __builtin_neon_vabdq_f16((int8x16_t)__sw0, (int8x16_t)__sw1, 40);
  return __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0);
#endif
}

/* vabd_f16: wraps __builtin_neon_vabd_f16 (selector 8). */
__ai __attribute__((target("fullfp16,neon"))) float16x4_t vabd_f16(float16x4_t __p0, float16x4_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return (float16x4_t) __builtin_neon_vabd_f16((int8x8_t)__p0, (int8x8_t)__p1, 8);
#else
  float16x4_t __sw0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  float16x4_t __sw1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  float16x4_t __res = (float16x4_t) __builtin_neon_vabd_f16((int8x8_t)__sw0, (int8x8_t)__sw1, 8);
  return __builtin_shufflevector(__res, __res, 3, 2, 1, 0);
#endif
}

/* vabsq_f16: wraps __builtin_neon_vabsq_f16 (selector 40). */
__ai __attribute__((target("fullfp16,neon"))) float16x8_t vabsq_f16(float16x8_t __p0) {
#ifdef __LITTLE_ENDIAN__
  return (float16x8_t) __builtin_neon_vabsq_f16((int8x16_t)__p0, 40);
#else
  float16x8_t __sw0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  float16x8_t __res = (float16x8_t) __builtin_neon_vabsq_f16((int8x16_t)__sw0, 40);
  return __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0);
#endif
}

/* vabs_f16: wraps __builtin_neon_vabs_f16 (selector 8). */
__ai __attribute__((target("fullfp16,neon"))) float16x4_t vabs_f16(float16x4_t __p0) {
#ifdef __LITTLE_ENDIAN__
  return (float16x4_t) __builtin_neon_vabs_f16((int8x8_t)__p0, 8);
#else
  float16x4_t __sw0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  float16x4_t __res = (float16x4_t) __builtin_neon_vabs_f16((int8x8_t)__sw0, 8);
  return __builtin_shufflevector(__res, __res, 3, 2, 1, 0);
#endif
}

/* vaddq_f16: applies the vector `+` operator to two float16x8_t values. */
__ai __attribute__((target("fullfp16,neon"))) float16x8_t vaddq_f16(float16x8_t __p0, float16x8_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return __p0 + __p1;
#else
  float16x8_t __sw0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  float16x8_t __sw1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  float16x8_t __res = __sw0 + __sw1;
  return __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0);
#endif
}

/* vadd_f16: applies the vector `+` operator to two float16x4_t values. */
__ai __attribute__((target("fullfp16,neon"))) float16x4_t vadd_f16(float16x4_t __p0, float16x4_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return __p0 + __p1;
#else
  float16x4_t __sw0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  float16x4_t __sw1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  float16x4_t __res = __sw0 + __sw1;
  return __builtin_shufflevector(__res, __res, 3, 2, 1, 0);
#endif
}

/* vcageq_f16: wraps __builtin_neon_vcageq_f16 (selector 49). */
__ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcageq_f16(float16x8_t __p0, float16x8_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return (uint16x8_t) __builtin_neon_vcageq_f16((int8x16_t)__p0, (int8x16_t)__p1, 49);
#else
  float16x8_t __sw0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  float16x8_t __sw1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  uint16x8_t __res = (uint16x8_t) __builtin_neon_vcageq_f16((int8x16_t)__sw0, (int8x16_t)__sw1, 49);
  return __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0);
#endif
}

/* vcage_f16: wraps __builtin_neon_vcage_f16 (selector 17). */
__ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcage_f16(float16x4_t __p0, float16x4_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return (uint16x4_t) __builtin_neon_vcage_f16((int8x8_t)__p0, (int8x8_t)__p1, 17);
#else
  float16x4_t __sw0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  float16x4_t __sw1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  uint16x4_t __res = (uint16x4_t) __builtin_neon_vcage_f16((int8x8_t)__sw0, (int8x8_t)__sw1, 17);
  return __builtin_shufflevector(__res, __res, 3, 2, 1, 0);
#endif
}

/* vcagtq_f16: wraps __builtin_neon_vcagtq_f16 (selector 49). */
__ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcagtq_f16(float16x8_t __p0, float16x8_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return (uint16x8_t) __builtin_neon_vcagtq_f16((int8x16_t)__p0, (int8x16_t)__p1, 49);
#else
  float16x8_t __sw0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  float16x8_t __sw1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  uint16x8_t __res = (uint16x8_t) __builtin_neon_vcagtq_f16((int8x16_t)__sw0, (int8x16_t)__sw1, 49);
  return __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0);
#endif
}

/* vcagt_f16: wraps __builtin_neon_vcagt_f16 (selector 17). */
__ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcagt_f16(float16x4_t __p0, float16x4_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return (uint16x4_t) __builtin_neon_vcagt_f16((int8x8_t)__p0, (int8x8_t)__p1, 17);
#else
  float16x4_t __sw0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0);
  float16x4_t __sw1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0);
  uint16x4_t __res = (uint16x4_t) __builtin_neon_vcagt_f16((int8x8_t)__sw0, (int8x8_t)__sw1, 17);
  return __builtin_shufflevector(__res, __res, 3, 2, 1, 0);
#endif
}

/* vcaleq_f16: wraps __builtin_neon_vcaleq_f16 (selector 49). */
__ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcaleq_f16(float16x8_t __p0, float16x8_t __p1) {
#ifdef __LITTLE_ENDIAN__
  return (uint16x8_t) __builtin_neon_vcaleq_f16((int8x16_t)__p0, (int8x16_t)__p1, 49);
#else
  float16x8_t __sw0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0);
  float16x8_t __sw1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0);
  uint16x8_t __res = (uint16x8_t) __builtin_neon_vcaleq_f16((int8x16_t)__sw0, (int8x16_t)__sw1, 49);
  return __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0);
#endif
}

#ifdef
__LITTLE_ENDIAN__ 1830 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcale_f16(float16x4_t __p0, float16x4_t __p1) { 1831 uint16x4_t __ret; 1832 __ret = (uint16x4_t) __builtin_neon_vcale_f16((int8x8_t)__p0, (int8x8_t)__p1, 17); 1833 return __ret; 1834 } 1835 #else 1836 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcale_f16(float16x4_t __p0, float16x4_t __p1) { 1837 uint16x4_t __ret; 1838 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 1839 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 1840 __ret = (uint16x4_t) __builtin_neon_vcale_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 1841 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 1842 return __ret; 1843 } 1844 #endif 1845 1846 #ifdef __LITTLE_ENDIAN__ 1847 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcaltq_f16(float16x8_t __p0, float16x8_t __p1) { 1848 uint16x8_t __ret; 1849 __ret = (uint16x8_t) __builtin_neon_vcaltq_f16((int8x16_t)__p0, (int8x16_t)__p1, 49); 1850 return __ret; 1851 } 1852 #else 1853 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcaltq_f16(float16x8_t __p0, float16x8_t __p1) { 1854 uint16x8_t __ret; 1855 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 1856 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 1857 __ret = (uint16x8_t) __builtin_neon_vcaltq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 1858 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 1859 return __ret; 1860 } 1861 #endif 1862 1863 #ifdef __LITTLE_ENDIAN__ 1864 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcalt_f16(float16x4_t __p0, float16x4_t __p1) { 1865 uint16x4_t __ret; 1866 __ret = (uint16x4_t) __builtin_neon_vcalt_f16((int8x8_t)__p0, (int8x8_t)__p1, 17); 1867 return __ret; 1868 } 1869 #else 1870 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcalt_f16(float16x4_t __p0, float16x4_t __p1) 
{ 1871 uint16x4_t __ret; 1872 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 1873 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 1874 __ret = (uint16x4_t) __builtin_neon_vcalt_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 1875 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 1876 return __ret; 1877 } 1878 #endif 1879 1880 #ifdef __LITTLE_ENDIAN__ 1881 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vceqq_f16(float16x8_t __p0, float16x8_t __p1) { 1882 uint16x8_t __ret; 1883 __ret = (uint16x8_t)(__p0 == __p1); 1884 return __ret; 1885 } 1886 #else 1887 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vceqq_f16(float16x8_t __p0, float16x8_t __p1) { 1888 uint16x8_t __ret; 1889 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 1890 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 1891 __ret = (uint16x8_t)(__rev0 == __rev1); 1892 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 1893 return __ret; 1894 } 1895 #endif 1896 1897 #ifdef __LITTLE_ENDIAN__ 1898 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vceq_f16(float16x4_t __p0, float16x4_t __p1) { 1899 uint16x4_t __ret; 1900 __ret = (uint16x4_t)(__p0 == __p1); 1901 return __ret; 1902 } 1903 #else 1904 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vceq_f16(float16x4_t __p0, float16x4_t __p1) { 1905 uint16x4_t __ret; 1906 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 1907 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 1908 __ret = (uint16x4_t)(__rev0 == __rev1); 1909 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 1910 return __ret; 1911 } 1912 #endif 1913 1914 #ifdef __LITTLE_ENDIAN__ 1915 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vceqzq_f16(float16x8_t __p0) { 1916 uint16x8_t __ret; 1917 __ret = (uint16x8_t) 
__builtin_neon_vceqzq_f16((int8x16_t)__p0, 49); 1918 return __ret; 1919 } 1920 #else 1921 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vceqzq_f16(float16x8_t __p0) { 1922 uint16x8_t __ret; 1923 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 1924 __ret = (uint16x8_t) __builtin_neon_vceqzq_f16((int8x16_t)__rev0, 49); 1925 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 1926 return __ret; 1927 } 1928 #endif 1929 1930 #ifdef __LITTLE_ENDIAN__ 1931 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vceqz_f16(float16x4_t __p0) { 1932 uint16x4_t __ret; 1933 __ret = (uint16x4_t) __builtin_neon_vceqz_f16((int8x8_t)__p0, 17); 1934 return __ret; 1935 } 1936 #else 1937 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vceqz_f16(float16x4_t __p0) { 1938 uint16x4_t __ret; 1939 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 1940 __ret = (uint16x4_t) __builtin_neon_vceqz_f16((int8x8_t)__rev0, 17); 1941 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 1942 return __ret; 1943 } 1944 #endif 1945 1946 #ifdef __LITTLE_ENDIAN__ 1947 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgeq_f16(float16x8_t __p0, float16x8_t __p1) { 1948 uint16x8_t __ret; 1949 __ret = (uint16x8_t)(__p0 >= __p1); 1950 return __ret; 1951 } 1952 #else 1953 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgeq_f16(float16x8_t __p0, float16x8_t __p1) { 1954 uint16x8_t __ret; 1955 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 1956 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 1957 __ret = (uint16x8_t)(__rev0 >= __rev1); 1958 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 1959 return __ret; 1960 } 1961 #endif 1962 1963 #ifdef __LITTLE_ENDIAN__ 1964 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcge_f16(float16x4_t __p0, float16x4_t __p1) { 1965 
uint16x4_t __ret; 1966 __ret = (uint16x4_t)(__p0 >= __p1); 1967 return __ret; 1968 } 1969 #else 1970 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcge_f16(float16x4_t __p0, float16x4_t __p1) { 1971 uint16x4_t __ret; 1972 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 1973 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 1974 __ret = (uint16x4_t)(__rev0 >= __rev1); 1975 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 1976 return __ret; 1977 } 1978 #endif 1979 1980 #ifdef __LITTLE_ENDIAN__ 1981 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgezq_f16(float16x8_t __p0) { 1982 uint16x8_t __ret; 1983 __ret = (uint16x8_t) __builtin_neon_vcgezq_f16((int8x16_t)__p0, 49); 1984 return __ret; 1985 } 1986 #else 1987 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgezq_f16(float16x8_t __p0) { 1988 uint16x8_t __ret; 1989 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 1990 __ret = (uint16x8_t) __builtin_neon_vcgezq_f16((int8x16_t)__rev0, 49); 1991 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 1992 return __ret; 1993 } 1994 #endif 1995 1996 #ifdef __LITTLE_ENDIAN__ 1997 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgez_f16(float16x4_t __p0) { 1998 uint16x4_t __ret; 1999 __ret = (uint16x4_t) __builtin_neon_vcgez_f16((int8x8_t)__p0, 17); 2000 return __ret; 2001 } 2002 #else 2003 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgez_f16(float16x4_t __p0) { 2004 uint16x4_t __ret; 2005 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2006 __ret = (uint16x4_t) __builtin_neon_vcgez_f16((int8x8_t)__rev0, 17); 2007 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2008 return __ret; 2009 } 2010 #endif 2011 2012 #ifdef __LITTLE_ENDIAN__ 2013 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgtq_f16(float16x8_t __p0, float16x8_t __p1) { 2014 uint16x8_t 
__ret; 2015 __ret = (uint16x8_t)(__p0 > __p1); 2016 return __ret; 2017 } 2018 #else 2019 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgtq_f16(float16x8_t __p0, float16x8_t __p1) { 2020 uint16x8_t __ret; 2021 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2022 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 2023 __ret = (uint16x8_t)(__rev0 > __rev1); 2024 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2025 return __ret; 2026 } 2027 #endif 2028 2029 #ifdef __LITTLE_ENDIAN__ 2030 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgt_f16(float16x4_t __p0, float16x4_t __p1) { 2031 uint16x4_t __ret; 2032 __ret = (uint16x4_t)(__p0 > __p1); 2033 return __ret; 2034 } 2035 #else 2036 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgt_f16(float16x4_t __p0, float16x4_t __p1) { 2037 uint16x4_t __ret; 2038 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2039 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 2040 __ret = (uint16x4_t)(__rev0 > __rev1); 2041 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2042 return __ret; 2043 } 2044 #endif 2045 2046 #ifdef __LITTLE_ENDIAN__ 2047 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgtzq_f16(float16x8_t __p0) { 2048 uint16x8_t __ret; 2049 __ret = (uint16x8_t) __builtin_neon_vcgtzq_f16((int8x16_t)__p0, 49); 2050 return __ret; 2051 } 2052 #else 2053 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcgtzq_f16(float16x8_t __p0) { 2054 uint16x8_t __ret; 2055 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2056 __ret = (uint16x8_t) __builtin_neon_vcgtzq_f16((int8x16_t)__rev0, 49); 2057 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2058 return __ret; 2059 } 2060 #endif 2061 2062 #ifdef __LITTLE_ENDIAN__ 2063 __ai 
__attribute__((target("fullfp16,neon"))) uint16x4_t vcgtz_f16(float16x4_t __p0) { 2064 uint16x4_t __ret; 2065 __ret = (uint16x4_t) __builtin_neon_vcgtz_f16((int8x8_t)__p0, 17); 2066 return __ret; 2067 } 2068 #else 2069 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcgtz_f16(float16x4_t __p0) { 2070 uint16x4_t __ret; 2071 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2072 __ret = (uint16x4_t) __builtin_neon_vcgtz_f16((int8x8_t)__rev0, 17); 2073 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2074 return __ret; 2075 } 2076 #endif 2077 2078 #ifdef __LITTLE_ENDIAN__ 2079 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcleq_f16(float16x8_t __p0, float16x8_t __p1) { 2080 uint16x8_t __ret; 2081 __ret = (uint16x8_t)(__p0 <= __p1); 2082 return __ret; 2083 } 2084 #else 2085 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcleq_f16(float16x8_t __p0, float16x8_t __p1) { 2086 uint16x8_t __ret; 2087 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2088 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 2089 __ret = (uint16x8_t)(__rev0 <= __rev1); 2090 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2091 return __ret; 2092 } 2093 #endif 2094 2095 #ifdef __LITTLE_ENDIAN__ 2096 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcle_f16(float16x4_t __p0, float16x4_t __p1) { 2097 uint16x4_t __ret; 2098 __ret = (uint16x4_t)(__p0 <= __p1); 2099 return __ret; 2100 } 2101 #else 2102 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcle_f16(float16x4_t __p0, float16x4_t __p1) { 2103 uint16x4_t __ret; 2104 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2105 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 2106 __ret = (uint16x4_t)(__rev0 <= __rev1); 2107 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2108 return __ret; 2109 } 2110 
#endif 2111 2112 #ifdef __LITTLE_ENDIAN__ 2113 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vclezq_f16(float16x8_t __p0) { 2114 uint16x8_t __ret; 2115 __ret = (uint16x8_t) __builtin_neon_vclezq_f16((int8x16_t)__p0, 49); 2116 return __ret; 2117 } 2118 #else 2119 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vclezq_f16(float16x8_t __p0) { 2120 uint16x8_t __ret; 2121 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2122 __ret = (uint16x8_t) __builtin_neon_vclezq_f16((int8x16_t)__rev0, 49); 2123 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2124 return __ret; 2125 } 2126 #endif 2127 2128 #ifdef __LITTLE_ENDIAN__ 2129 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vclez_f16(float16x4_t __p0) { 2130 uint16x4_t __ret; 2131 __ret = (uint16x4_t) __builtin_neon_vclez_f16((int8x8_t)__p0, 17); 2132 return __ret; 2133 } 2134 #else 2135 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vclez_f16(float16x4_t __p0) { 2136 uint16x4_t __ret; 2137 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2138 __ret = (uint16x4_t) __builtin_neon_vclez_f16((int8x8_t)__rev0, 17); 2139 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2140 return __ret; 2141 } 2142 #endif 2143 2144 #ifdef __LITTLE_ENDIAN__ 2145 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcltq_f16(float16x8_t __p0, float16x8_t __p1) { 2146 uint16x8_t __ret; 2147 __ret = (uint16x8_t)(__p0 < __p1); 2148 return __ret; 2149 } 2150 #else 2151 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcltq_f16(float16x8_t __p0, float16x8_t __p1) { 2152 uint16x8_t __ret; 2153 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2154 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 2155 __ret = (uint16x8_t)(__rev0 < __rev1); 2156 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2157 
return __ret; 2158 } 2159 #endif 2160 2161 #ifdef __LITTLE_ENDIAN__ 2162 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vclt_f16(float16x4_t __p0, float16x4_t __p1) { 2163 uint16x4_t __ret; 2164 __ret = (uint16x4_t)(__p0 < __p1); 2165 return __ret; 2166 } 2167 #else 2168 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vclt_f16(float16x4_t __p0, float16x4_t __p1) { 2169 uint16x4_t __ret; 2170 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2171 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 2172 __ret = (uint16x4_t)(__rev0 < __rev1); 2173 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2174 return __ret; 2175 } 2176 #endif 2177 2178 #ifdef __LITTLE_ENDIAN__ 2179 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcltzq_f16(float16x8_t __p0) { 2180 uint16x8_t __ret; 2181 __ret = (uint16x8_t) __builtin_neon_vcltzq_f16((int8x16_t)__p0, 49); 2182 return __ret; 2183 } 2184 #else 2185 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcltzq_f16(float16x8_t __p0) { 2186 uint16x8_t __ret; 2187 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2188 __ret = (uint16x8_t) __builtin_neon_vcltzq_f16((int8x16_t)__rev0, 49); 2189 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2190 return __ret; 2191 } 2192 #endif 2193 2194 #ifdef __LITTLE_ENDIAN__ 2195 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcltz_f16(float16x4_t __p0) { 2196 uint16x4_t __ret; 2197 __ret = (uint16x4_t) __builtin_neon_vcltz_f16((int8x8_t)__p0, 17); 2198 return __ret; 2199 } 2200 #else 2201 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcltz_f16(float16x4_t __p0) { 2202 uint16x4_t __ret; 2203 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2204 __ret = (uint16x4_t) __builtin_neon_vcltz_f16((int8x8_t)__rev0, 17); 2205 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2206 return __ret; 
2207 } 2208 #endif 2209 2210 #ifdef __LITTLE_ENDIAN__ 2211 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vcvtq_f16_u16(uint16x8_t __p0) { 2212 float16x8_t __ret; 2213 __ret = (float16x8_t) __builtin_neon_vcvtq_f16_u16((int8x16_t)__p0, 49); 2214 return __ret; 2215 } 2216 #else 2217 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vcvtq_f16_u16(uint16x8_t __p0) { 2218 float16x8_t __ret; 2219 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2220 __ret = (float16x8_t) __builtin_neon_vcvtq_f16_u16((int8x16_t)__rev0, 49); 2221 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2222 return __ret; 2223 } 2224 #endif 2225 2226 #ifdef __LITTLE_ENDIAN__ 2227 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vcvtq_f16_s16(int16x8_t __p0) { 2228 float16x8_t __ret; 2229 __ret = (float16x8_t) __builtin_neon_vcvtq_f16_s16((int8x16_t)__p0, 33); 2230 return __ret; 2231 } 2232 #else 2233 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vcvtq_f16_s16(int16x8_t __p0) { 2234 float16x8_t __ret; 2235 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2236 __ret = (float16x8_t) __builtin_neon_vcvtq_f16_s16((int8x16_t)__rev0, 33); 2237 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2238 return __ret; 2239 } 2240 #endif 2241 2242 #ifdef __LITTLE_ENDIAN__ 2243 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vcvt_f16_u16(uint16x4_t __p0) { 2244 float16x4_t __ret; 2245 __ret = (float16x4_t) __builtin_neon_vcvt_f16_u16((int8x8_t)__p0, 17); 2246 return __ret; 2247 } 2248 #else 2249 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vcvt_f16_u16(uint16x4_t __p0) { 2250 float16x4_t __ret; 2251 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2252 __ret = (float16x4_t) __builtin_neon_vcvt_f16_u16((int8x8_t)__rev0, 17); 2253 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2254 return 
__ret; 2255 } 2256 #endif 2257 2258 #ifdef __LITTLE_ENDIAN__ 2259 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vcvt_f16_s16(int16x4_t __p0) { 2260 float16x4_t __ret; 2261 __ret = (float16x4_t) __builtin_neon_vcvt_f16_s16((int8x8_t)__p0, 1); 2262 return __ret; 2263 } 2264 #else 2265 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vcvt_f16_s16(int16x4_t __p0) { 2266 float16x4_t __ret; 2267 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2268 __ret = (float16x4_t) __builtin_neon_vcvt_f16_s16((int8x8_t)__rev0, 1); 2269 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2270 return __ret; 2271 } 2272 #endif 2273 2274 #ifdef __LITTLE_ENDIAN__ 2275 #define vcvtq_n_f16_u16(__p0, __p1) __extension__ ({ \ 2276 float16x8_t __ret; \ 2277 uint16x8_t __s0 = __p0; \ 2278 __ret = (float16x8_t) __builtin_neon_vcvtq_n_f16_u16((int8x16_t)__s0, __p1, 49); \ 2279 __ret; \ 2280 }) 2281 #else 2282 #define vcvtq_n_f16_u16(__p0, __p1) __extension__ ({ \ 2283 float16x8_t __ret; \ 2284 uint16x8_t __s0 = __p0; \ 2285 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 2286 __ret = (float16x8_t) __builtin_neon_vcvtq_n_f16_u16((int8x16_t)__rev0, __p1, 49); \ 2287 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 2288 __ret; \ 2289 }) 2290 #endif 2291 2292 #ifdef __LITTLE_ENDIAN__ 2293 #define vcvtq_n_f16_s16(__p0, __p1) __extension__ ({ \ 2294 float16x8_t __ret; \ 2295 int16x8_t __s0 = __p0; \ 2296 __ret = (float16x8_t) __builtin_neon_vcvtq_n_f16_s16((int8x16_t)__s0, __p1, 33); \ 2297 __ret; \ 2298 }) 2299 #else 2300 #define vcvtq_n_f16_s16(__p0, __p1) __extension__ ({ \ 2301 float16x8_t __ret; \ 2302 int16x8_t __s0 = __p0; \ 2303 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 2304 __ret = (float16x8_t) __builtin_neon_vcvtq_n_f16_s16((int8x16_t)__rev0, __p1, 33); \ 2305 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 
1, 0); \ 2306 __ret; \ 2307 }) 2308 #endif 2309 2310 #ifdef __LITTLE_ENDIAN__ 2311 #define vcvt_n_f16_u16(__p0, __p1) __extension__ ({ \ 2312 float16x4_t __ret; \ 2313 uint16x4_t __s0 = __p0; \ 2314 __ret = (float16x4_t) __builtin_neon_vcvt_n_f16_u16((int8x8_t)__s0, __p1, 17); \ 2315 __ret; \ 2316 }) 2317 #else 2318 #define vcvt_n_f16_u16(__p0, __p1) __extension__ ({ \ 2319 float16x4_t __ret; \ 2320 uint16x4_t __s0 = __p0; \ 2321 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 2322 __ret = (float16x4_t) __builtin_neon_vcvt_n_f16_u16((int8x8_t)__rev0, __p1, 17); \ 2323 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 2324 __ret; \ 2325 }) 2326 #endif 2327 2328 #ifdef __LITTLE_ENDIAN__ 2329 #define vcvt_n_f16_s16(__p0, __p1) __extension__ ({ \ 2330 float16x4_t __ret; \ 2331 int16x4_t __s0 = __p0; \ 2332 __ret = (float16x4_t) __builtin_neon_vcvt_n_f16_s16((int8x8_t)__s0, __p1, 1); \ 2333 __ret; \ 2334 }) 2335 #else 2336 #define vcvt_n_f16_s16(__p0, __p1) __extension__ ({ \ 2337 float16x4_t __ret; \ 2338 int16x4_t __s0 = __p0; \ 2339 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 2340 __ret = (float16x4_t) __builtin_neon_vcvt_n_f16_s16((int8x8_t)__rev0, __p1, 1); \ 2341 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 2342 __ret; \ 2343 }) 2344 #endif 2345 2346 #ifdef __LITTLE_ENDIAN__ 2347 #define vcvtq_n_s16_f16(__p0, __p1) __extension__ ({ \ 2348 int16x8_t __ret; \ 2349 float16x8_t __s0 = __p0; \ 2350 __ret = (int16x8_t) __builtin_neon_vcvtq_n_s16_f16((int8x16_t)__s0, __p1, 33); \ 2351 __ret; \ 2352 }) 2353 #else 2354 #define vcvtq_n_s16_f16(__p0, __p1) __extension__ ({ \ 2355 int16x8_t __ret; \ 2356 float16x8_t __s0 = __p0; \ 2357 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 2358 __ret = (int16x8_t) __builtin_neon_vcvtq_n_s16_f16((int8x16_t)__rev0, __p1, 33); \ 2359 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 
0); \ 2360 __ret; \ 2361 }) 2362 #endif 2363 2364 #ifdef __LITTLE_ENDIAN__ 2365 #define vcvt_n_s16_f16(__p0, __p1) __extension__ ({ \ 2366 int16x4_t __ret; \ 2367 float16x4_t __s0 = __p0; \ 2368 __ret = (int16x4_t) __builtin_neon_vcvt_n_s16_f16((int8x8_t)__s0, __p1, 1); \ 2369 __ret; \ 2370 }) 2371 #else 2372 #define vcvt_n_s16_f16(__p0, __p1) __extension__ ({ \ 2373 int16x4_t __ret; \ 2374 float16x4_t __s0 = __p0; \ 2375 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 2376 __ret = (int16x4_t) __builtin_neon_vcvt_n_s16_f16((int8x8_t)__rev0, __p1, 1); \ 2377 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 2378 __ret; \ 2379 }) 2380 #endif 2381 2382 #ifdef __LITTLE_ENDIAN__ 2383 #define vcvtq_n_u16_f16(__p0, __p1) __extension__ ({ \ 2384 uint16x8_t __ret; \ 2385 float16x8_t __s0 = __p0; \ 2386 __ret = (uint16x8_t) __builtin_neon_vcvtq_n_u16_f16((int8x16_t)__s0, __p1, 49); \ 2387 __ret; \ 2388 }) 2389 #else 2390 #define vcvtq_n_u16_f16(__p0, __p1) __extension__ ({ \ 2391 uint16x8_t __ret; \ 2392 float16x8_t __s0 = __p0; \ 2393 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 2394 __ret = (uint16x8_t) __builtin_neon_vcvtq_n_u16_f16((int8x16_t)__rev0, __p1, 49); \ 2395 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 2396 __ret; \ 2397 }) 2398 #endif 2399 2400 #ifdef __LITTLE_ENDIAN__ 2401 #define vcvt_n_u16_f16(__p0, __p1) __extension__ ({ \ 2402 uint16x4_t __ret; \ 2403 float16x4_t __s0 = __p0; \ 2404 __ret = (uint16x4_t) __builtin_neon_vcvt_n_u16_f16((int8x8_t)__s0, __p1, 17); \ 2405 __ret; \ 2406 }) 2407 #else 2408 #define vcvt_n_u16_f16(__p0, __p1) __extension__ ({ \ 2409 uint16x4_t __ret; \ 2410 float16x4_t __s0 = __p0; \ 2411 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 2412 __ret = (uint16x4_t) __builtin_neon_vcvt_n_u16_f16((int8x8_t)__rev0, __p1, 17); \ 2413 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 
\ 2414 __ret; \ 2415 }) 2416 #endif 2417 2418 #ifdef __LITTLE_ENDIAN__ 2419 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtq_s16_f16(float16x8_t __p0) { 2420 int16x8_t __ret; 2421 __ret = (int16x8_t) __builtin_neon_vcvtq_s16_f16((int8x16_t)__p0, 33); 2422 return __ret; 2423 } 2424 #else 2425 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtq_s16_f16(float16x8_t __p0) { 2426 int16x8_t __ret; 2427 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2428 __ret = (int16x8_t) __builtin_neon_vcvtq_s16_f16((int8x16_t)__rev0, 33); 2429 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2430 return __ret; 2431 } 2432 #endif 2433 2434 #ifdef __LITTLE_ENDIAN__ 2435 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvt_s16_f16(float16x4_t __p0) { 2436 int16x4_t __ret; 2437 __ret = (int16x4_t) __builtin_neon_vcvt_s16_f16((int8x8_t)__p0, 1); 2438 return __ret; 2439 } 2440 #else 2441 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvt_s16_f16(float16x4_t __p0) { 2442 int16x4_t __ret; 2443 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2444 __ret = (int16x4_t) __builtin_neon_vcvt_s16_f16((int8x8_t)__rev0, 1); 2445 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2446 return __ret; 2447 } 2448 #endif 2449 2450 #ifdef __LITTLE_ENDIAN__ 2451 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtq_u16_f16(float16x8_t __p0) { 2452 uint16x8_t __ret; 2453 __ret = (uint16x8_t) __builtin_neon_vcvtq_u16_f16((int8x16_t)__p0, 49); 2454 return __ret; 2455 } 2456 #else 2457 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtq_u16_f16(float16x8_t __p0) { 2458 uint16x8_t __ret; 2459 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2460 __ret = (uint16x8_t) __builtin_neon_vcvtq_u16_f16((int8x16_t)__rev0, 49); 2461 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2462 return __ret; 
2463 } 2464 #endif 2465 2466 #ifdef __LITTLE_ENDIAN__ 2467 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvt_u16_f16(float16x4_t __p0) { 2468 uint16x4_t __ret; 2469 __ret = (uint16x4_t) __builtin_neon_vcvt_u16_f16((int8x8_t)__p0, 17); 2470 return __ret; 2471 } 2472 #else 2473 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvt_u16_f16(float16x4_t __p0) { 2474 uint16x4_t __ret; 2475 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2476 __ret = (uint16x4_t) __builtin_neon_vcvt_u16_f16((int8x8_t)__rev0, 17); 2477 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2478 return __ret; 2479 } 2480 #endif 2481 2482 #ifdef __LITTLE_ENDIAN__ 2483 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtaq_s16_f16(float16x8_t __p0) { 2484 int16x8_t __ret; 2485 __ret = (int16x8_t) __builtin_neon_vcvtaq_s16_f16((int8x16_t)__p0, 33); 2486 return __ret; 2487 } 2488 #else 2489 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtaq_s16_f16(float16x8_t __p0) { 2490 int16x8_t __ret; 2491 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2492 __ret = (int16x8_t) __builtin_neon_vcvtaq_s16_f16((int8x16_t)__rev0, 33); 2493 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2494 return __ret; 2495 } 2496 #endif 2497 2498 #ifdef __LITTLE_ENDIAN__ 2499 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvta_s16_f16(float16x4_t __p0) { 2500 int16x4_t __ret; 2501 __ret = (int16x4_t) __builtin_neon_vcvta_s16_f16((int8x8_t)__p0, 1); 2502 return __ret; 2503 } 2504 #else 2505 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvta_s16_f16(float16x4_t __p0) { 2506 int16x4_t __ret; 2507 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2508 __ret = (int16x4_t) __builtin_neon_vcvta_s16_f16((int8x8_t)__rev0, 1); 2509 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2510 return __ret; 2511 } 2512 #endif 2513 2514 #ifdef 
__LITTLE_ENDIAN__ 2515 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtaq_u16_f16(float16x8_t __p0) { 2516 uint16x8_t __ret; 2517 __ret = (uint16x8_t) __builtin_neon_vcvtaq_u16_f16((int8x16_t)__p0, 49); 2518 return __ret; 2519 } 2520 #else 2521 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtaq_u16_f16(float16x8_t __p0) { 2522 uint16x8_t __ret; 2523 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2524 __ret = (uint16x8_t) __builtin_neon_vcvtaq_u16_f16((int8x16_t)__rev0, 49); 2525 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2526 return __ret; 2527 } 2528 #endif 2529 2530 #ifdef __LITTLE_ENDIAN__ 2531 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvta_u16_f16(float16x4_t __p0) { 2532 uint16x4_t __ret; 2533 __ret = (uint16x4_t) __builtin_neon_vcvta_u16_f16((int8x8_t)__p0, 17); 2534 return __ret; 2535 } 2536 #else 2537 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvta_u16_f16(float16x4_t __p0) { 2538 uint16x4_t __ret; 2539 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2540 __ret = (uint16x4_t) __builtin_neon_vcvta_u16_f16((int8x8_t)__rev0, 17); 2541 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2542 return __ret; 2543 } 2544 #endif 2545 2546 #ifdef __LITTLE_ENDIAN__ 2547 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtmq_s16_f16(float16x8_t __p0) { 2548 int16x8_t __ret; 2549 __ret = (int16x8_t) __builtin_neon_vcvtmq_s16_f16((int8x16_t)__p0, 33); 2550 return __ret; 2551 } 2552 #else 2553 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtmq_s16_f16(float16x8_t __p0) { 2554 int16x8_t __ret; 2555 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2556 __ret = (int16x8_t) __builtin_neon_vcvtmq_s16_f16((int8x16_t)__rev0, 33); 2557 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2558 return __ret; 2559 } 2560 #endif 2561 2562 
#ifdef __LITTLE_ENDIAN__ 2563 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtm_s16_f16(float16x4_t __p0) { 2564 int16x4_t __ret; 2565 __ret = (int16x4_t) __builtin_neon_vcvtm_s16_f16((int8x8_t)__p0, 1); 2566 return __ret; 2567 } 2568 #else 2569 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtm_s16_f16(float16x4_t __p0) { 2570 int16x4_t __ret; 2571 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2572 __ret = (int16x4_t) __builtin_neon_vcvtm_s16_f16((int8x8_t)__rev0, 1); 2573 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2574 return __ret; 2575 } 2576 #endif 2577 2578 #ifdef __LITTLE_ENDIAN__ 2579 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtmq_u16_f16(float16x8_t __p0) { 2580 uint16x8_t __ret; 2581 __ret = (uint16x8_t) __builtin_neon_vcvtmq_u16_f16((int8x16_t)__p0, 49); 2582 return __ret; 2583 } 2584 #else 2585 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtmq_u16_f16(float16x8_t __p0) { 2586 uint16x8_t __ret; 2587 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2588 __ret = (uint16x8_t) __builtin_neon_vcvtmq_u16_f16((int8x16_t)__rev0, 49); 2589 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2590 return __ret; 2591 } 2592 #endif 2593 2594 #ifdef __LITTLE_ENDIAN__ 2595 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtm_u16_f16(float16x4_t __p0) { 2596 uint16x4_t __ret; 2597 __ret = (uint16x4_t) __builtin_neon_vcvtm_u16_f16((int8x8_t)__p0, 17); 2598 return __ret; 2599 } 2600 #else 2601 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtm_u16_f16(float16x4_t __p0) { 2602 uint16x4_t __ret; 2603 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2604 __ret = (uint16x4_t) __builtin_neon_vcvtm_u16_f16((int8x8_t)__rev0, 17); 2605 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2606 return __ret; 2607 } 2608 #endif 2609 2610 #ifdef __LITTLE_ENDIAN__ 2611 
__ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtnq_s16_f16(float16x8_t __p0) { 2612 int16x8_t __ret; 2613 __ret = (int16x8_t) __builtin_neon_vcvtnq_s16_f16((int8x16_t)__p0, 33); 2614 return __ret; 2615 } 2616 #else 2617 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtnq_s16_f16(float16x8_t __p0) { 2618 int16x8_t __ret; 2619 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2620 __ret = (int16x8_t) __builtin_neon_vcvtnq_s16_f16((int8x16_t)__rev0, 33); 2621 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2622 return __ret; 2623 } 2624 #endif 2625 2626 #ifdef __LITTLE_ENDIAN__ 2627 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtn_s16_f16(float16x4_t __p0) { 2628 int16x4_t __ret; 2629 __ret = (int16x4_t) __builtin_neon_vcvtn_s16_f16((int8x8_t)__p0, 1); 2630 return __ret; 2631 } 2632 #else 2633 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtn_s16_f16(float16x4_t __p0) { 2634 int16x4_t __ret; 2635 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2636 __ret = (int16x4_t) __builtin_neon_vcvtn_s16_f16((int8x8_t)__rev0, 1); 2637 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2638 return __ret; 2639 } 2640 #endif 2641 2642 #ifdef __LITTLE_ENDIAN__ 2643 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtnq_u16_f16(float16x8_t __p0) { 2644 uint16x8_t __ret; 2645 __ret = (uint16x8_t) __builtin_neon_vcvtnq_u16_f16((int8x16_t)__p0, 49); 2646 return __ret; 2647 } 2648 #else 2649 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtnq_u16_f16(float16x8_t __p0) { 2650 uint16x8_t __ret; 2651 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2652 __ret = (uint16x8_t) __builtin_neon_vcvtnq_u16_f16((int8x16_t)__rev0, 49); 2653 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2654 return __ret; 2655 } 2656 #endif 2657 2658 #ifdef __LITTLE_ENDIAN__ 2659 __ai 
__attribute__((target("fullfp16,neon"))) uint16x4_t vcvtn_u16_f16(float16x4_t __p0) { 2660 uint16x4_t __ret; 2661 __ret = (uint16x4_t) __builtin_neon_vcvtn_u16_f16((int8x8_t)__p0, 17); 2662 return __ret; 2663 } 2664 #else 2665 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtn_u16_f16(float16x4_t __p0) { 2666 uint16x4_t __ret; 2667 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2668 __ret = (uint16x4_t) __builtin_neon_vcvtn_u16_f16((int8x8_t)__rev0, 17); 2669 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2670 return __ret; 2671 } 2672 #endif 2673 2674 #ifdef __LITTLE_ENDIAN__ 2675 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtpq_s16_f16(float16x8_t __p0) { 2676 int16x8_t __ret; 2677 __ret = (int16x8_t) __builtin_neon_vcvtpq_s16_f16((int8x16_t)__p0, 33); 2678 return __ret; 2679 } 2680 #else 2681 __ai __attribute__((target("fullfp16,neon"))) int16x8_t vcvtpq_s16_f16(float16x8_t __p0) { 2682 int16x8_t __ret; 2683 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2684 __ret = (int16x8_t) __builtin_neon_vcvtpq_s16_f16((int8x16_t)__rev0, 33); 2685 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2686 return __ret; 2687 } 2688 #endif 2689 2690 #ifdef __LITTLE_ENDIAN__ 2691 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtp_s16_f16(float16x4_t __p0) { 2692 int16x4_t __ret; 2693 __ret = (int16x4_t) __builtin_neon_vcvtp_s16_f16((int8x8_t)__p0, 1); 2694 return __ret; 2695 } 2696 #else 2697 __ai __attribute__((target("fullfp16,neon"))) int16x4_t vcvtp_s16_f16(float16x4_t __p0) { 2698 int16x4_t __ret; 2699 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2700 __ret = (int16x4_t) __builtin_neon_vcvtp_s16_f16((int8x8_t)__rev0, 1); 2701 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2702 return __ret; 2703 } 2704 #endif 2705 2706 #ifdef __LITTLE_ENDIAN__ 2707 __ai 
__attribute__((target("fullfp16,neon"))) uint16x8_t vcvtpq_u16_f16(float16x8_t __p0) { 2708 uint16x8_t __ret; 2709 __ret = (uint16x8_t) __builtin_neon_vcvtpq_u16_f16((int8x16_t)__p0, 49); 2710 return __ret; 2711 } 2712 #else 2713 __ai __attribute__((target("fullfp16,neon"))) uint16x8_t vcvtpq_u16_f16(float16x8_t __p0) { 2714 uint16x8_t __ret; 2715 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2716 __ret = (uint16x8_t) __builtin_neon_vcvtpq_u16_f16((int8x16_t)__rev0, 49); 2717 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2718 return __ret; 2719 } 2720 #endif 2721 2722 #ifdef __LITTLE_ENDIAN__ 2723 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtp_u16_f16(float16x4_t __p0) { 2724 uint16x4_t __ret; 2725 __ret = (uint16x4_t) __builtin_neon_vcvtp_u16_f16((int8x8_t)__p0, 17); 2726 return __ret; 2727 } 2728 #else 2729 __ai __attribute__((target("fullfp16,neon"))) uint16x4_t vcvtp_u16_f16(float16x4_t __p0) { 2730 uint16x4_t __ret; 2731 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2732 __ret = (uint16x4_t) __builtin_neon_vcvtp_u16_f16((int8x8_t)__rev0, 17); 2733 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2734 return __ret; 2735 } 2736 #endif 2737 2738 #ifdef __LITTLE_ENDIAN__ 2739 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vfmaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 2740 float16x8_t __ret; 2741 __ret = (float16x8_t) __builtin_neon_vfmaq_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 2742 return __ret; 2743 } 2744 #else 2745 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vfmaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 2746 float16x8_t __ret; 2747 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2748 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 2749 float16x8_t __rev2; __rev2 = 
__builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 2750 __ret = (float16x8_t) __builtin_neon_vfmaq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40); 2751 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2752 return __ret; 2753 } 2754 __ai __attribute__((target("fullfp16,neon"))) float16x8_t __noswap_vfmaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 2755 float16x8_t __ret; 2756 __ret = (float16x8_t) __builtin_neon_vfmaq_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 2757 return __ret; 2758 } 2759 #endif 2760 2761 #ifdef __LITTLE_ENDIAN__ 2762 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vfma_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 2763 float16x4_t __ret; 2764 __ret = (float16x4_t) __builtin_neon_vfma_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 2765 return __ret; 2766 } 2767 #else 2768 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vfma_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 2769 float16x4_t __ret; 2770 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2771 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 2772 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 2773 __ret = (float16x4_t) __builtin_neon_vfma_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8); 2774 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2775 return __ret; 2776 } 2777 __ai __attribute__((target("fullfp16,neon"))) float16x4_t __noswap_vfma_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 2778 float16x4_t __ret; 2779 __ret = (float16x4_t) __builtin_neon_vfma_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 2780 return __ret; 2781 } 2782 #endif 2783 2784 #ifdef __LITTLE_ENDIAN__ 2785 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vfmsq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 2786 float16x8_t 
__ret; 2787 __ret = vfmaq_f16(__p0, -__p1, __p2); 2788 return __ret; 2789 } 2790 #else 2791 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vfmsq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 2792 float16x8_t __ret; 2793 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2794 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 2795 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 2796 __ret = __noswap_vfmaq_f16(__rev0, -__rev1, __rev2); 2797 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2798 return __ret; 2799 } 2800 #endif 2801 2802 #ifdef __LITTLE_ENDIAN__ 2803 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vfms_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 2804 float16x4_t __ret; 2805 __ret = vfma_f16(__p0, -__p1, __p2); 2806 return __ret; 2807 } 2808 #else 2809 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vfms_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 2810 float16x4_t __ret; 2811 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2812 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 2813 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 2814 __ret = __noswap_vfma_f16(__rev0, -__rev1, __rev2); 2815 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2816 return __ret; 2817 } 2818 #endif 2819 2820 #ifdef __LITTLE_ENDIAN__ 2821 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmaxq_f16(float16x8_t __p0, float16x8_t __p1) { 2822 float16x8_t __ret; 2823 __ret = (float16x8_t) __builtin_neon_vmaxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 2824 return __ret; 2825 } 2826 #else 2827 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmaxq_f16(float16x8_t __p0, float16x8_t __p1) { 2828 float16x8_t __ret; 2829 float16x8_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2830 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 2831 __ret = (float16x8_t) __builtin_neon_vmaxq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 2832 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2833 return __ret; 2834 } 2835 #endif 2836 2837 #ifdef __LITTLE_ENDIAN__ 2838 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmax_f16(float16x4_t __p0, float16x4_t __p1) { 2839 float16x4_t __ret; 2840 __ret = (float16x4_t) __builtin_neon_vmax_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 2841 return __ret; 2842 } 2843 #else 2844 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmax_f16(float16x4_t __p0, float16x4_t __p1) { 2845 float16x4_t __ret; 2846 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2847 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 2848 __ret = (float16x4_t) __builtin_neon_vmax_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 2849 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2850 return __ret; 2851 } 2852 #endif 2853 2854 #ifdef __LITTLE_ENDIAN__ 2855 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vminq_f16(float16x8_t __p0, float16x8_t __p1) { 2856 float16x8_t __ret; 2857 __ret = (float16x8_t) __builtin_neon_vminq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 2858 return __ret; 2859 } 2860 #else 2861 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vminq_f16(float16x8_t __p0, float16x8_t __p1) { 2862 float16x8_t __ret; 2863 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2864 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 2865 __ret = (float16x8_t) __builtin_neon_vminq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 2866 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2867 return __ret; 2868 } 2869 #endif 2870 2871 #ifdef 
__LITTLE_ENDIAN__ 2872 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmin_f16(float16x4_t __p0, float16x4_t __p1) { 2873 float16x4_t __ret; 2874 __ret = (float16x4_t) __builtin_neon_vmin_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 2875 return __ret; 2876 } 2877 #else 2878 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmin_f16(float16x4_t __p0, float16x4_t __p1) { 2879 float16x4_t __ret; 2880 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2881 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 2882 __ret = (float16x4_t) __builtin_neon_vmin_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 2883 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2884 return __ret; 2885 } 2886 #endif 2887 2888 #ifdef __LITTLE_ENDIAN__ 2889 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmulq_f16(float16x8_t __p0, float16x8_t __p1) { 2890 float16x8_t __ret; 2891 __ret = __p0 * __p1; 2892 return __ret; 2893 } 2894 #else 2895 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmulq_f16(float16x8_t __p0, float16x8_t __p1) { 2896 float16x8_t __ret; 2897 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2898 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 2899 __ret = __rev0 * __rev1; 2900 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2901 return __ret; 2902 } 2903 #endif 2904 2905 #ifdef __LITTLE_ENDIAN__ 2906 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmul_f16(float16x4_t __p0, float16x4_t __p1) { 2907 float16x4_t __ret; 2908 __ret = __p0 * __p1; 2909 return __ret; 2910 } 2911 #else 2912 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmul_f16(float16x4_t __p0, float16x4_t __p1) { 2913 float16x4_t __ret; 2914 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2915 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 
0); 2916 __ret = __rev0 * __rev1; 2917 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2918 return __ret; 2919 } 2920 #endif 2921 2922 #ifdef __LITTLE_ENDIAN__ 2923 #define vmulq_n_f16(__p0, __p1) __extension__ ({ \ 2924 float16x8_t __ret; \ 2925 float16x8_t __s0 = __p0; \ 2926 float16_t __s1 = __p1; \ 2927 __ret = __s0 * (float16x8_t) {__s1, __s1, __s1, __s1, __s1, __s1, __s1, __s1}; \ 2928 __ret; \ 2929 }) 2930 #else 2931 #define vmulq_n_f16(__p0, __p1) __extension__ ({ \ 2932 float16x8_t __ret; \ 2933 float16x8_t __s0 = __p0; \ 2934 float16_t __s1 = __p1; \ 2935 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 2936 __ret = __rev0 * (float16x8_t) {__s1, __s1, __s1, __s1, __s1, __s1, __s1, __s1}; \ 2937 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 2938 __ret; \ 2939 }) 2940 #endif 2941 2942 #ifdef __LITTLE_ENDIAN__ 2943 #define vmul_n_f16(__p0, __p1) __extension__ ({ \ 2944 float16x4_t __ret; \ 2945 float16x4_t __s0 = __p0; \ 2946 float16_t __s1 = __p1; \ 2947 __ret = __s0 * (float16x4_t) {__s1, __s1, __s1, __s1}; \ 2948 __ret; \ 2949 }) 2950 #else 2951 #define vmul_n_f16(__p0, __p1) __extension__ ({ \ 2952 float16x4_t __ret; \ 2953 float16x4_t __s0 = __p0; \ 2954 float16_t __s1 = __p1; \ 2955 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 2956 __ret = __rev0 * (float16x4_t) {__s1, __s1, __s1, __s1}; \ 2957 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 2958 __ret; \ 2959 }) 2960 #endif 2961 2962 #ifdef __LITTLE_ENDIAN__ 2963 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vnegq_f16(float16x8_t __p0) { 2964 float16x8_t __ret; 2965 __ret = -__p0; 2966 return __ret; 2967 } 2968 #else 2969 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vnegq_f16(float16x8_t __p0) { 2970 float16x8_t __ret; 2971 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 2972 __ret = -__rev0; 2973 __ret = 
__builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 2974 return __ret; 2975 } 2976 #endif 2977 2978 #ifdef __LITTLE_ENDIAN__ 2979 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vneg_f16(float16x4_t __p0) { 2980 float16x4_t __ret; 2981 __ret = -__p0; 2982 return __ret; 2983 } 2984 #else 2985 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vneg_f16(float16x4_t __p0) { 2986 float16x4_t __ret; 2987 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 2988 __ret = -__rev0; 2989 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 2990 return __ret; 2991 } 2992 #endif 2993 2994 #ifdef __LITTLE_ENDIAN__ 2995 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpadd_f16(float16x4_t __p0, float16x4_t __p1) { 2996 float16x4_t __ret; 2997 __ret = (float16x4_t) __builtin_neon_vpadd_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 2998 return __ret; 2999 } 3000 #else 3001 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpadd_f16(float16x4_t __p0, float16x4_t __p1) { 3002 float16x4_t __ret; 3003 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3004 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 3005 __ret = (float16x4_t) __builtin_neon_vpadd_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 3006 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3007 return __ret; 3008 } 3009 #endif 3010 3011 #ifdef __LITTLE_ENDIAN__ 3012 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmax_f16(float16x4_t __p0, float16x4_t __p1) { 3013 float16x4_t __ret; 3014 __ret = (float16x4_t) __builtin_neon_vpmax_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 3015 return __ret; 3016 } 3017 #else 3018 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmax_f16(float16x4_t __p0, float16x4_t __p1) { 3019 float16x4_t __ret; 3020 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3021 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, 
__p1, 3, 2, 1, 0); 3022 __ret = (float16x4_t) __builtin_neon_vpmax_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 3023 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3024 return __ret; 3025 } 3026 #endif 3027 3028 #ifdef __LITTLE_ENDIAN__ 3029 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmin_f16(float16x4_t __p0, float16x4_t __p1) { 3030 float16x4_t __ret; 3031 __ret = (float16x4_t) __builtin_neon_vpmin_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 3032 return __ret; 3033 } 3034 #else 3035 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmin_f16(float16x4_t __p0, float16x4_t __p1) { 3036 float16x4_t __ret; 3037 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3038 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 3039 __ret = (float16x4_t) __builtin_neon_vpmin_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 3040 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3041 return __ret; 3042 } 3043 #endif 3044 3045 #ifdef __LITTLE_ENDIAN__ 3046 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrecpeq_f16(float16x8_t __p0) { 3047 float16x8_t __ret; 3048 __ret = (float16x8_t) __builtin_neon_vrecpeq_f16((int8x16_t)__p0, 40); 3049 return __ret; 3050 } 3051 #else 3052 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrecpeq_f16(float16x8_t __p0) { 3053 float16x8_t __ret; 3054 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 3055 __ret = (float16x8_t) __builtin_neon_vrecpeq_f16((int8x16_t)__rev0, 40); 3056 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 3057 return __ret; 3058 } 3059 #endif 3060 3061 #ifdef __LITTLE_ENDIAN__ 3062 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrecpe_f16(float16x4_t __p0) { 3063 float16x4_t __ret; 3064 __ret = (float16x4_t) __builtin_neon_vrecpe_f16((int8x8_t)__p0, 8); 3065 return __ret; 3066 } 3067 #else 3068 __ai __attribute__((target("fullfp16,neon"))) 
float16x4_t vrecpe_f16(float16x4_t __p0) { 3069 float16x4_t __ret; 3070 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3071 __ret = (float16x4_t) __builtin_neon_vrecpe_f16((int8x8_t)__rev0, 8); 3072 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3073 return __ret; 3074 } 3075 #endif 3076 3077 #ifdef __LITTLE_ENDIAN__ 3078 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrecpsq_f16(float16x8_t __p0, float16x8_t __p1) { 3079 float16x8_t __ret; 3080 __ret = (float16x8_t) __builtin_neon_vrecpsq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 3081 return __ret; 3082 } 3083 #else 3084 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrecpsq_f16(float16x8_t __p0, float16x8_t __p1) { 3085 float16x8_t __ret; 3086 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 3087 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 3088 __ret = (float16x8_t) __builtin_neon_vrecpsq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 3089 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 3090 return __ret; 3091 } 3092 #endif 3093 3094 #ifdef __LITTLE_ENDIAN__ 3095 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrecps_f16(float16x4_t __p0, float16x4_t __p1) { 3096 float16x4_t __ret; 3097 __ret = (float16x4_t) __builtin_neon_vrecps_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 3098 return __ret; 3099 } 3100 #else 3101 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrecps_f16(float16x4_t __p0, float16x4_t __p1) { 3102 float16x4_t __ret; 3103 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3104 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 3105 __ret = (float16x4_t) __builtin_neon_vrecps_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 3106 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3107 return __ret; 3108 } 3109 #endif 3110 3111 #ifdef __LITTLE_ENDIAN__ 
3112 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrsqrteq_f16(float16x8_t __p0) { 3113 float16x8_t __ret; 3114 __ret = (float16x8_t) __builtin_neon_vrsqrteq_f16((int8x16_t)__p0, 40); 3115 return __ret; 3116 } 3117 #else 3118 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrsqrteq_f16(float16x8_t __p0) { 3119 float16x8_t __ret; 3120 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 3121 __ret = (float16x8_t) __builtin_neon_vrsqrteq_f16((int8x16_t)__rev0, 40); 3122 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 3123 return __ret; 3124 } 3125 #endif 3126 3127 #ifdef __LITTLE_ENDIAN__ 3128 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrsqrte_f16(float16x4_t __p0) { 3129 float16x4_t __ret; 3130 __ret = (float16x4_t) __builtin_neon_vrsqrte_f16((int8x8_t)__p0, 8); 3131 return __ret; 3132 } 3133 #else 3134 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrsqrte_f16(float16x4_t __p0) { 3135 float16x4_t __ret; 3136 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3137 __ret = (float16x4_t) __builtin_neon_vrsqrte_f16((int8x8_t)__rev0, 8); 3138 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3139 return __ret; 3140 } 3141 #endif 3142 3143 #ifdef __LITTLE_ENDIAN__ 3144 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrsqrtsq_f16(float16x8_t __p0, float16x8_t __p1) { 3145 float16x8_t __ret; 3146 __ret = (float16x8_t) __builtin_neon_vrsqrtsq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 3147 return __ret; 3148 } 3149 #else 3150 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrsqrtsq_f16(float16x8_t __p0, float16x8_t __p1) { 3151 float16x8_t __ret; 3152 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 3153 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 3154 __ret = (float16x8_t) __builtin_neon_vrsqrtsq_f16((int8x16_t)__rev0, 
(int8x16_t)__rev1, 40); 3155 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 3156 return __ret; 3157 } 3158 #endif 3159 3160 #ifdef __LITTLE_ENDIAN__ 3161 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrsqrts_f16(float16x4_t __p0, float16x4_t __p1) { 3162 float16x4_t __ret; 3163 __ret = (float16x4_t) __builtin_neon_vrsqrts_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 3164 return __ret; 3165 } 3166 #else 3167 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrsqrts_f16(float16x4_t __p0, float16x4_t __p1) { 3168 float16x4_t __ret; 3169 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3170 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 3171 __ret = (float16x4_t) __builtin_neon_vrsqrts_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 3172 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3173 return __ret; 3174 } 3175 #endif 3176 3177 #ifdef __LITTLE_ENDIAN__ 3178 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vsubq_f16(float16x8_t __p0, float16x8_t __p1) { 3179 float16x8_t __ret; 3180 __ret = __p0 - __p1; 3181 return __ret; 3182 } 3183 #else 3184 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vsubq_f16(float16x8_t __p0, float16x8_t __p1) { 3185 float16x8_t __ret; 3186 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 3187 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 3188 __ret = __rev0 - __rev1; 3189 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 3190 return __ret; 3191 } 3192 #endif 3193 3194 #ifdef __LITTLE_ENDIAN__ 3195 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vsub_f16(float16x4_t __p0, float16x4_t __p1) { 3196 float16x4_t __ret; 3197 __ret = __p0 - __p1; 3198 return __ret; 3199 } 3200 #else 3201 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vsub_f16(float16x4_t __p0, float16x4_t __p1) { 3202 float16x4_t 
__ret; 3203 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3204 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 3205 __ret = __rev0 - __rev1; 3206 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3207 return __ret; 3208 } 3209 #endif 3210 3211 #ifdef __LITTLE_ENDIAN__ 3212 __ai __attribute__((target("i8mm,neon"))) uint32x4_t vmmlaq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 3213 uint32x4_t __ret; 3214 __ret = (uint32x4_t) __builtin_neon_vmmlaq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 3215 return __ret; 3216 } 3217 #else 3218 __ai __attribute__((target("i8mm,neon"))) uint32x4_t vmmlaq_u32(uint32x4_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 3219 uint32x4_t __ret; 3220 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3221 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 3222 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 3223 __ret = (uint32x4_t) __builtin_neon_vmmlaq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 3224 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3225 return __ret; 3226 } 3227 #endif 3228 3229 #ifdef __LITTLE_ENDIAN__ 3230 __ai __attribute__((target("i8mm,neon"))) int32x4_t vmmlaq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) { 3231 int32x4_t __ret; 3232 __ret = (int32x4_t) __builtin_neon_vmmlaq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 3233 return __ret; 3234 } 3235 #else 3236 __ai __attribute__((target("i8mm,neon"))) int32x4_t vmmlaq_s32(int32x4_t __p0, int8x16_t __p1, int8x16_t __p2) { 3237 int32x4_t __ret; 3238 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3239 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 3240 int8x16_t 
__rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 3241 __ret = (int32x4_t) __builtin_neon_vmmlaq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34); 3242 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3243 return __ret; 3244 } 3245 #endif 3246 3247 #ifdef __LITTLE_ENDIAN__ 3248 __ai __attribute__((target("i8mm,neon"))) int32x4_t vusdotq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) { 3249 int32x4_t __ret; 3250 __ret = (int32x4_t) __builtin_neon_vusdotq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 3251 return __ret; 3252 } 3253 #else 3254 __ai __attribute__((target("i8mm,neon"))) int32x4_t vusdotq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) { 3255 int32x4_t __ret; 3256 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3257 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 3258 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 3259 __ret = (int32x4_t) __builtin_neon_vusdotq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34); 3260 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3261 return __ret; 3262 } 3263 __ai __attribute__((target("i8mm,neon"))) int32x4_t __noswap_vusdotq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) { 3264 int32x4_t __ret; 3265 __ret = (int32x4_t) __builtin_neon_vusdotq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 3266 return __ret; 3267 } 3268 #endif 3269 3270 #ifdef __LITTLE_ENDIAN__ 3271 __ai __attribute__((target("i8mm,neon"))) int32x2_t vusdot_s32(int32x2_t __p0, uint8x8_t __p1, int8x8_t __p2) { 3272 int32x2_t __ret; 3273 __ret = (int32x2_t) __builtin_neon_vusdot_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2); 3274 return __ret; 3275 } 3276 #else 3277 __ai __attribute__((target("i8mm,neon"))) int32x2_t 
vusdot_s32(int32x2_t __p0, uint8x8_t __p1, int8x8_t __p2) { 3278 int32x2_t __ret; 3279 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 3280 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 3281 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 3282 __ret = (int32x2_t) __builtin_neon_vusdot_s32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2); 3283 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 3284 return __ret; 3285 } 3286 __ai __attribute__((target("i8mm,neon"))) int32x2_t __noswap_vusdot_s32(int32x2_t __p0, uint8x8_t __p1, int8x8_t __p2) { 3287 int32x2_t __ret; 3288 __ret = (int32x2_t) __builtin_neon_vusdot_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2); 3289 return __ret; 3290 } 3291 #endif 3292 3293 #ifdef __LITTLE_ENDIAN__ 3294 __ai __attribute__((target("i8mm,neon"))) int32x4_t vusmmlaq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) { 3295 int32x4_t __ret; 3296 __ret = (int32x4_t) __builtin_neon_vusmmlaq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 3297 return __ret; 3298 } 3299 #else 3300 __ai __attribute__((target("i8mm,neon"))) int32x4_t vusmmlaq_s32(int32x4_t __p0, uint8x16_t __p1, int8x16_t __p2) { 3301 int32x4_t __ret; 3302 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 3303 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 3304 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 3305 __ret = (int32x4_t) __builtin_neon_vusmmlaq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34); 3306 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 3307 return __ret; 3308 } 3309 #endif 3310 3311 #ifdef __LITTLE_ENDIAN__ 3312 #define splat_lane_p8(__p0, __p1) __extension__ ({ \ 3313 poly8x8_t __ret; \ 3314 poly8x8_t __s0 = __p0; \ 3315 __ret = 
(poly8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 4); \ 3316 __ret; \ 3317 }) 3318 #else 3319 #define splat_lane_p8(__p0, __p1) __extension__ ({ \ 3320 poly8x8_t __ret; \ 3321 poly8x8_t __s0 = __p0; \ 3322 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 3323 __ret = (poly8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 4); \ 3324 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 3325 __ret; \ 3326 }) 3327 #define __noswap_splat_lane_p8(__p0, __p1) __extension__ ({ \ 3328 poly8x8_t __ret; \ 3329 poly8x8_t __s0 = __p0; \ 3330 __ret = (poly8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 4); \ 3331 __ret; \ 3332 }) 3333 #endif 3334 3335 #define splat_lane_p64(__p0, __p1) __extension__ ({ \ 3336 poly64x1_t __ret; \ 3337 poly64x1_t __s0 = __p0; \ 3338 __ret = (poly64x1_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 6); \ 3339 __ret; \ 3340 }) 3341 #ifdef __LITTLE_ENDIAN__ 3342 #define splat_lane_p16(__p0, __p1) __extension__ ({ \ 3343 poly16x4_t __ret; \ 3344 poly16x4_t __s0 = __p0; \ 3345 __ret = (poly16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 5); \ 3346 __ret; \ 3347 }) 3348 #else 3349 #define splat_lane_p16(__p0, __p1) __extension__ ({ \ 3350 poly16x4_t __ret; \ 3351 poly16x4_t __s0 = __p0; \ 3352 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 3353 __ret = (poly16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 5); \ 3354 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 3355 __ret; \ 3356 }) 3357 #define __noswap_splat_lane_p16(__p0, __p1) __extension__ ({ \ 3358 poly16x4_t __ret; \ 3359 poly16x4_t __s0 = __p0; \ 3360 __ret = (poly16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 5); \ 3361 __ret; \ 3362 }) 3363 #endif 3364 3365 #ifdef __LITTLE_ENDIAN__ 3366 #define splatq_lane_p8(__p0, __p1) __extension__ ({ \ 3367 poly8x16_t __ret; \ 3368 poly8x8_t __s0 = __p0; \ 3369 __ret = (poly8x16_t) 
__builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 4); \ 3370 __ret; \ 3371 }) 3372 #else 3373 #define splatq_lane_p8(__p0, __p1) __extension__ ({ \ 3374 poly8x16_t __ret; \ 3375 poly8x8_t __s0 = __p0; \ 3376 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 3377 __ret = (poly8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 4); \ 3378 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 3379 __ret; \ 3380 }) 3381 #define __noswap_splatq_lane_p8(__p0, __p1) __extension__ ({ \ 3382 poly8x16_t __ret; \ 3383 poly8x8_t __s0 = __p0; \ 3384 __ret = (poly8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 4); \ 3385 __ret; \ 3386 }) 3387 #endif 3388 3389 #ifdef __LITTLE_ENDIAN__ 3390 #define splatq_lane_p64(__p0, __p1) __extension__ ({ \ 3391 poly64x2_t __ret; \ 3392 poly64x1_t __s0 = __p0; \ 3393 __ret = (poly64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 6); \ 3394 __ret; \ 3395 }) 3396 #else 3397 #define splatq_lane_p64(__p0, __p1) __extension__ ({ \ 3398 poly64x2_t __ret; \ 3399 poly64x1_t __s0 = __p0; \ 3400 __ret = (poly64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 6); \ 3401 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 3402 __ret; \ 3403 }) 3404 #define __noswap_splatq_lane_p64(__p0, __p1) __extension__ ({ \ 3405 poly64x2_t __ret; \ 3406 poly64x1_t __s0 = __p0; \ 3407 __ret = (poly64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 6); \ 3408 __ret; \ 3409 }) 3410 #endif 3411 3412 #ifdef __LITTLE_ENDIAN__ 3413 #define splatq_lane_p16(__p0, __p1) __extension__ ({ \ 3414 poly16x8_t __ret; \ 3415 poly16x4_t __s0 = __p0; \ 3416 __ret = (poly16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 5); \ 3417 __ret; \ 3418 }) 3419 #else 3420 #define splatq_lane_p16(__p0, __p1) __extension__ ({ \ 3421 poly16x8_t __ret; \ 3422 poly16x4_t __s0 = __p0; \ 3423 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 
2, 1, 0); \ 3424 __ret = (poly16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 5); \ 3425 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 3426 __ret; \ 3427 }) 3428 #define __noswap_splatq_lane_p16(__p0, __p1) __extension__ ({ \ 3429 poly16x8_t __ret; \ 3430 poly16x4_t __s0 = __p0; \ 3431 __ret = (poly16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 5); \ 3432 __ret; \ 3433 }) 3434 #endif 3435 3436 #ifdef __LITTLE_ENDIAN__ 3437 #define splatq_lane_u8(__p0, __p1) __extension__ ({ \ 3438 uint8x16_t __ret; \ 3439 uint8x8_t __s0 = __p0; \ 3440 __ret = (uint8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 16); \ 3441 __ret; \ 3442 }) 3443 #else 3444 #define splatq_lane_u8(__p0, __p1) __extension__ ({ \ 3445 uint8x16_t __ret; \ 3446 uint8x8_t __s0 = __p0; \ 3447 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 3448 __ret = (uint8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 16); \ 3449 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 3450 __ret; \ 3451 }) 3452 #define __noswap_splatq_lane_u8(__p0, __p1) __extension__ ({ \ 3453 uint8x16_t __ret; \ 3454 uint8x8_t __s0 = __p0; \ 3455 __ret = (uint8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 16); \ 3456 __ret; \ 3457 }) 3458 #endif 3459 3460 #ifdef __LITTLE_ENDIAN__ 3461 #define splatq_lane_u32(__p0, __p1) __extension__ ({ \ 3462 uint32x4_t __ret; \ 3463 uint32x2_t __s0 = __p0; \ 3464 __ret = (uint32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 18); \ 3465 __ret; \ 3466 }) 3467 #else 3468 #define splatq_lane_u32(__p0, __p1) __extension__ ({ \ 3469 uint32x4_t __ret; \ 3470 uint32x2_t __s0 = __p0; \ 3471 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 3472 __ret = (uint32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 18); \ 3473 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 3474 __ret; \ 
3475 }) 3476 #define __noswap_splatq_lane_u32(__p0, __p1) __extension__ ({ \ 3477 uint32x4_t __ret; \ 3478 uint32x2_t __s0 = __p0; \ 3479 __ret = (uint32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 18); \ 3480 __ret; \ 3481 }) 3482 #endif 3483 3484 #ifdef __LITTLE_ENDIAN__ 3485 #define splatq_lane_u64(__p0, __p1) __extension__ ({ \ 3486 uint64x2_t __ret; \ 3487 uint64x1_t __s0 = __p0; \ 3488 __ret = (uint64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 19); \ 3489 __ret; \ 3490 }) 3491 #else 3492 #define splatq_lane_u64(__p0, __p1) __extension__ ({ \ 3493 uint64x2_t __ret; \ 3494 uint64x1_t __s0 = __p0; \ 3495 __ret = (uint64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 19); \ 3496 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 3497 __ret; \ 3498 }) 3499 #define __noswap_splatq_lane_u64(__p0, __p1) __extension__ ({ \ 3500 uint64x2_t __ret; \ 3501 uint64x1_t __s0 = __p0; \ 3502 __ret = (uint64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 19); \ 3503 __ret; \ 3504 }) 3505 #endif 3506 3507 #ifdef __LITTLE_ENDIAN__ 3508 #define splatq_lane_u16(__p0, __p1) __extension__ ({ \ 3509 uint16x8_t __ret; \ 3510 uint16x4_t __s0 = __p0; \ 3511 __ret = (uint16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 17); \ 3512 __ret; \ 3513 }) 3514 #else 3515 #define splatq_lane_u16(__p0, __p1) __extension__ ({ \ 3516 uint16x8_t __ret; \ 3517 uint16x4_t __s0 = __p0; \ 3518 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 3519 __ret = (uint16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 17); \ 3520 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 3521 __ret; \ 3522 }) 3523 #define __noswap_splatq_lane_u16(__p0, __p1) __extension__ ({ \ 3524 uint16x8_t __ret; \ 3525 uint16x4_t __s0 = __p0; \ 3526 __ret = (uint16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 17); \ 3527 __ret; \ 3528 }) 3529 #endif 3530 3531 #ifdef __LITTLE_ENDIAN__ 3532 #define 
splatq_lane_s8(__p0, __p1) __extension__ ({ \ 3533 int8x16_t __ret; \ 3534 int8x8_t __s0 = __p0; \ 3535 __ret = (int8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 0); \ 3536 __ret; \ 3537 }) 3538 #else 3539 #define splatq_lane_s8(__p0, __p1) __extension__ ({ \ 3540 int8x16_t __ret; \ 3541 int8x8_t __s0 = __p0; \ 3542 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 3543 __ret = (int8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 0); \ 3544 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 3545 __ret; \ 3546 }) 3547 #define __noswap_splatq_lane_s8(__p0, __p1) __extension__ ({ \ 3548 int8x16_t __ret; \ 3549 int8x8_t __s0 = __p0; \ 3550 __ret = (int8x16_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 0); \ 3551 __ret; \ 3552 }) 3553 #endif 3554 3555 #ifdef __LITTLE_ENDIAN__ 3556 #define splatq_lane_f64(__p0, __p1) __extension__ ({ \ 3557 float64x2_t __ret; \ 3558 float64x1_t __s0 = __p0; \ 3559 __ret = (float64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 10); \ 3560 __ret; \ 3561 }) 3562 #else 3563 #define splatq_lane_f64(__p0, __p1) __extension__ ({ \ 3564 float64x2_t __ret; \ 3565 float64x1_t __s0 = __p0; \ 3566 __ret = (float64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 10); \ 3567 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 3568 __ret; \ 3569 }) 3570 #define __noswap_splatq_lane_f64(__p0, __p1) __extension__ ({ \ 3571 float64x2_t __ret; \ 3572 float64x1_t __s0 = __p0; \ 3573 __ret = (float64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 10); \ 3574 __ret; \ 3575 }) 3576 #endif 3577 3578 #ifdef __LITTLE_ENDIAN__ 3579 #define splatq_lane_f32(__p0, __p1) __extension__ ({ \ 3580 float32x4_t __ret; \ 3581 float32x2_t __s0 = __p0; \ 3582 __ret = (float32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 9); \ 3583 __ret; \ 3584 }) 3585 #else 3586 #define splatq_lane_f32(__p0, __p1) __extension__ 
({ \ 3587 float32x4_t __ret; \ 3588 float32x2_t __s0 = __p0; \ 3589 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 3590 __ret = (float32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 9); \ 3591 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 3592 __ret; \ 3593 }) 3594 #define __noswap_splatq_lane_f32(__p0, __p1) __extension__ ({ \ 3595 float32x4_t __ret; \ 3596 float32x2_t __s0 = __p0; \ 3597 __ret = (float32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 9); \ 3598 __ret; \ 3599 }) 3600 #endif 3601 3602 #ifdef __LITTLE_ENDIAN__ 3603 #define splatq_lane_f16(__p0, __p1) __extension__ ({ \ 3604 float16x8_t __ret; \ 3605 float16x4_t __s0 = __p0; \ 3606 __ret = (float16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 8); \ 3607 __ret; \ 3608 }) 3609 #else 3610 #define splatq_lane_f16(__p0, __p1) __extension__ ({ \ 3611 float16x8_t __ret; \ 3612 float16x4_t __s0 = __p0; \ 3613 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 3614 __ret = (float16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 8); \ 3615 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 3616 __ret; \ 3617 }) 3618 #define __noswap_splatq_lane_f16(__p0, __p1) __extension__ ({ \ 3619 float16x8_t __ret; \ 3620 float16x4_t __s0 = __p0; \ 3621 __ret = (float16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 8); \ 3622 __ret; \ 3623 }) 3624 #endif 3625 3626 #ifdef __LITTLE_ENDIAN__ 3627 #define splatq_lane_s32(__p0, __p1) __extension__ ({ \ 3628 int32x4_t __ret; \ 3629 int32x2_t __s0 = __p0; \ 3630 __ret = (int32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 2); \ 3631 __ret; \ 3632 }) 3633 #else 3634 #define splatq_lane_s32(__p0, __p1) __extension__ ({ \ 3635 int32x4_t __ret; \ 3636 int32x2_t __s0 = __p0; \ 3637 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 3638 __ret = (int32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 
2); \ 3639 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 3640 __ret; \ 3641 }) 3642 #define __noswap_splatq_lane_s32(__p0, __p1) __extension__ ({ \ 3643 int32x4_t __ret; \ 3644 int32x2_t __s0 = __p0; \ 3645 __ret = (int32x4_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 2); \ 3646 __ret; \ 3647 }) 3648 #endif 3649 3650 #ifdef __LITTLE_ENDIAN__ 3651 #define splatq_lane_s64(__p0, __p1) __extension__ ({ \ 3652 int64x2_t __ret; \ 3653 int64x1_t __s0 = __p0; \ 3654 __ret = (int64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 3); \ 3655 __ret; \ 3656 }) 3657 #else 3658 #define splatq_lane_s64(__p0, __p1) __extension__ ({ \ 3659 int64x2_t __ret; \ 3660 int64x1_t __s0 = __p0; \ 3661 __ret = (int64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 3); \ 3662 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 3663 __ret; \ 3664 }) 3665 #define __noswap_splatq_lane_s64(__p0, __p1) __extension__ ({ \ 3666 int64x2_t __ret; \ 3667 int64x1_t __s0 = __p0; \ 3668 __ret = (int64x2_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 3); \ 3669 __ret; \ 3670 }) 3671 #endif 3672 3673 #ifdef __LITTLE_ENDIAN__ 3674 #define splatq_lane_s16(__p0, __p1) __extension__ ({ \ 3675 int16x8_t __ret; \ 3676 int16x4_t __s0 = __p0; \ 3677 __ret = (int16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 1); \ 3678 __ret; \ 3679 }) 3680 #else 3681 #define splatq_lane_s16(__p0, __p1) __extension__ ({ \ 3682 int16x8_t __ret; \ 3683 int16x4_t __s0 = __p0; \ 3684 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 3685 __ret = (int16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__rev0, __p1, 1); \ 3686 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 3687 __ret; \ 3688 }) 3689 #define __noswap_splatq_lane_s16(__p0, __p1) __extension__ ({ \ 3690 int16x8_t __ret; \ 3691 int16x4_t __s0 = __p0; \ 3692 __ret = (int16x8_t) __builtin_neon_splatq_lane_v((int8x8_t)__s0, __p1, 1); \ 3693 __ret; \ 3694 }) 3695 #endif 
3696 3697 #ifdef __LITTLE_ENDIAN__ 3698 #define splat_lane_u8(__p0, __p1) __extension__ ({ \ 3699 uint8x8_t __ret; \ 3700 uint8x8_t __s0 = __p0; \ 3701 __ret = (uint8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 16); \ 3702 __ret; \ 3703 }) 3704 #else 3705 #define splat_lane_u8(__p0, __p1) __extension__ ({ \ 3706 uint8x8_t __ret; \ 3707 uint8x8_t __s0 = __p0; \ 3708 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 3709 __ret = (uint8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 16); \ 3710 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 3711 __ret; \ 3712 }) 3713 #define __noswap_splat_lane_u8(__p0, __p1) __extension__ ({ \ 3714 uint8x8_t __ret; \ 3715 uint8x8_t __s0 = __p0; \ 3716 __ret = (uint8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 16); \ 3717 __ret; \ 3718 }) 3719 #endif 3720 3721 #ifdef __LITTLE_ENDIAN__ 3722 #define splat_lane_u32(__p0, __p1) __extension__ ({ \ 3723 uint32x2_t __ret; \ 3724 uint32x2_t __s0 = __p0; \ 3725 __ret = (uint32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 18); \ 3726 __ret; \ 3727 }) 3728 #else 3729 #define splat_lane_u32(__p0, __p1) __extension__ ({ \ 3730 uint32x2_t __ret; \ 3731 uint32x2_t __s0 = __p0; \ 3732 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 3733 __ret = (uint32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 18); \ 3734 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 3735 __ret; \ 3736 }) 3737 #define __noswap_splat_lane_u32(__p0, __p1) __extension__ ({ \ 3738 uint32x2_t __ret; \ 3739 uint32x2_t __s0 = __p0; \ 3740 __ret = (uint32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 18); \ 3741 __ret; \ 3742 }) 3743 #endif 3744 3745 #define splat_lane_u64(__p0, __p1) __extension__ ({ \ 3746 uint64x1_t __ret; \ 3747 uint64x1_t __s0 = __p0; \ 3748 __ret = (uint64x1_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 19); \ 3749 __ret; \ 3750 }) 3751 #ifdef 
__LITTLE_ENDIAN__ 3752 #define splat_lane_u16(__p0, __p1) __extension__ ({ \ 3753 uint16x4_t __ret; \ 3754 uint16x4_t __s0 = __p0; \ 3755 __ret = (uint16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 17); \ 3756 __ret; \ 3757 }) 3758 #else 3759 #define splat_lane_u16(__p0, __p1) __extension__ ({ \ 3760 uint16x4_t __ret; \ 3761 uint16x4_t __s0 = __p0; \ 3762 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 3763 __ret = (uint16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 17); \ 3764 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 3765 __ret; \ 3766 }) 3767 #define __noswap_splat_lane_u16(__p0, __p1) __extension__ ({ \ 3768 uint16x4_t __ret; \ 3769 uint16x4_t __s0 = __p0; \ 3770 __ret = (uint16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 17); \ 3771 __ret; \ 3772 }) 3773 #endif 3774 3775 #ifdef __LITTLE_ENDIAN__ 3776 #define splat_lane_s8(__p0, __p1) __extension__ ({ \ 3777 int8x8_t __ret; \ 3778 int8x8_t __s0 = __p0; \ 3779 __ret = (int8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 0); \ 3780 __ret; \ 3781 }) 3782 #else 3783 #define splat_lane_s8(__p0, __p1) __extension__ ({ \ 3784 int8x8_t __ret; \ 3785 int8x8_t __s0 = __p0; \ 3786 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 3787 __ret = (int8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 0); \ 3788 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 3789 __ret; \ 3790 }) 3791 #define __noswap_splat_lane_s8(__p0, __p1) __extension__ ({ \ 3792 int8x8_t __ret; \ 3793 int8x8_t __s0 = __p0; \ 3794 __ret = (int8x8_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 0); \ 3795 __ret; \ 3796 }) 3797 #endif 3798 3799 #define splat_lane_f64(__p0, __p1) __extension__ ({ \ 3800 float64x1_t __ret; \ 3801 float64x1_t __s0 = __p0; \ 3802 __ret = (float64x1_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 10); \ 3803 __ret; \ 3804 }) 3805 #ifdef __LITTLE_ENDIAN__ 
3806 #define splat_lane_f32(__p0, __p1) __extension__ ({ \ 3807 float32x2_t __ret; \ 3808 float32x2_t __s0 = __p0; \ 3809 __ret = (float32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 9); \ 3810 __ret; \ 3811 }) 3812 #else 3813 #define splat_lane_f32(__p0, __p1) __extension__ ({ \ 3814 float32x2_t __ret; \ 3815 float32x2_t __s0 = __p0; \ 3816 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 3817 __ret = (float32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 9); \ 3818 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 3819 __ret; \ 3820 }) 3821 #define __noswap_splat_lane_f32(__p0, __p1) __extension__ ({ \ 3822 float32x2_t __ret; \ 3823 float32x2_t __s0 = __p0; \ 3824 __ret = (float32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 9); \ 3825 __ret; \ 3826 }) 3827 #endif 3828 3829 #ifdef __LITTLE_ENDIAN__ 3830 #define splat_lane_f16(__p0, __p1) __extension__ ({ \ 3831 float16x4_t __ret; \ 3832 float16x4_t __s0 = __p0; \ 3833 __ret = (float16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 8); \ 3834 __ret; \ 3835 }) 3836 #else 3837 #define splat_lane_f16(__p0, __p1) __extension__ ({ \ 3838 float16x4_t __ret; \ 3839 float16x4_t __s0 = __p0; \ 3840 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 3841 __ret = (float16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 8); \ 3842 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 3843 __ret; \ 3844 }) 3845 #define __noswap_splat_lane_f16(__p0, __p1) __extension__ ({ \ 3846 float16x4_t __ret; \ 3847 float16x4_t __s0 = __p0; \ 3848 __ret = (float16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 8); \ 3849 __ret; \ 3850 }) 3851 #endif 3852 3853 #ifdef __LITTLE_ENDIAN__ 3854 #define splat_lane_s32(__p0, __p1) __extension__ ({ \ 3855 int32x2_t __ret; \ 3856 int32x2_t __s0 = __p0; \ 3857 __ret = (int32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 2); \ 3858 __ret; \ 3859 }) 3860 #else 3861 #define 
splat_lane_s32(__p0, __p1) __extension__ ({ \ 3862 int32x2_t __ret; \ 3863 int32x2_t __s0 = __p0; \ 3864 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 3865 __ret = (int32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 2); \ 3866 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 3867 __ret; \ 3868 }) 3869 #define __noswap_splat_lane_s32(__p0, __p1) __extension__ ({ \ 3870 int32x2_t __ret; \ 3871 int32x2_t __s0 = __p0; \ 3872 __ret = (int32x2_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 2); \ 3873 __ret; \ 3874 }) 3875 #endif 3876 3877 #define splat_lane_s64(__p0, __p1) __extension__ ({ \ 3878 int64x1_t __ret; \ 3879 int64x1_t __s0 = __p0; \ 3880 __ret = (int64x1_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 3); \ 3881 __ret; \ 3882 }) 3883 #ifdef __LITTLE_ENDIAN__ 3884 #define splat_lane_s16(__p0, __p1) __extension__ ({ \ 3885 int16x4_t __ret; \ 3886 int16x4_t __s0 = __p0; \ 3887 __ret = (int16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 1); \ 3888 __ret; \ 3889 }) 3890 #else 3891 #define splat_lane_s16(__p0, __p1) __extension__ ({ \ 3892 int16x4_t __ret; \ 3893 int16x4_t __s0 = __p0; \ 3894 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 3895 __ret = (int16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__rev0, __p1, 1); \ 3896 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 3897 __ret; \ 3898 }) 3899 #define __noswap_splat_lane_s16(__p0, __p1) __extension__ ({ \ 3900 int16x4_t __ret; \ 3901 int16x4_t __s0 = __p0; \ 3902 __ret = (int16x4_t) __builtin_neon_splat_lane_v((int8x8_t)__s0, __p1, 1); \ 3903 __ret; \ 3904 }) 3905 #endif 3906 3907 #ifdef __LITTLE_ENDIAN__ 3908 #define splat_laneq_p8(__p0, __p1) __extension__ ({ \ 3909 poly8x8_t __ret; \ 3910 poly8x16_t __s0 = __p0; \ 3911 __ret = (poly8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 36); \ 3912 __ret; \ 3913 }) 3914 #else 3915 #define splat_laneq_p8(__p0, __p1) __extension__ ({ \ 3916 
poly8x8_t __ret; \ 3917 poly8x16_t __s0 = __p0; \ 3918 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 3919 __ret = (poly8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 36); \ 3920 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 3921 __ret; \ 3922 }) 3923 #define __noswap_splat_laneq_p8(__p0, __p1) __extension__ ({ \ 3924 poly8x8_t __ret; \ 3925 poly8x16_t __s0 = __p0; \ 3926 __ret = (poly8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 36); \ 3927 __ret; \ 3928 }) 3929 #endif 3930 3931 #ifdef __LITTLE_ENDIAN__ 3932 #define splat_laneq_p64(__p0, __p1) __extension__ ({ \ 3933 poly64x1_t __ret; \ 3934 poly64x2_t __s0 = __p0; \ 3935 __ret = (poly64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 38); \ 3936 __ret; \ 3937 }) 3938 #else 3939 #define splat_laneq_p64(__p0, __p1) __extension__ ({ \ 3940 poly64x1_t __ret; \ 3941 poly64x2_t __s0 = __p0; \ 3942 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 3943 __ret = (poly64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 38); \ 3944 __ret; \ 3945 }) 3946 #define __noswap_splat_laneq_p64(__p0, __p1) __extension__ ({ \ 3947 poly64x1_t __ret; \ 3948 poly64x2_t __s0 = __p0; \ 3949 __ret = (poly64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 38); \ 3950 __ret; \ 3951 }) 3952 #endif 3953 3954 #ifdef __LITTLE_ENDIAN__ 3955 #define splat_laneq_p16(__p0, __p1) __extension__ ({ \ 3956 poly16x4_t __ret; \ 3957 poly16x8_t __s0 = __p0; \ 3958 __ret = (poly16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 37); \ 3959 __ret; \ 3960 }) 3961 #else 3962 #define splat_laneq_p16(__p0, __p1) __extension__ ({ \ 3963 poly16x4_t __ret; \ 3964 poly16x8_t __s0 = __p0; \ 3965 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 3966 __ret = (poly16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 37); \ 3967 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 3968 __ret; \ 3969 }) 3970 #define __noswap_splat_laneq_p16(__p0, __p1) __extension__ ({ \ 3971 poly16x4_t __ret; \ 3972 poly16x8_t __s0 = __p0; \ 3973 __ret = (poly16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 37); \ 3974 __ret; \ 3975 }) 3976 #endif 3977 3978 #ifdef __LITTLE_ENDIAN__ 3979 #define splatq_laneq_p8(__p0, __p1) __extension__ ({ \ 3980 poly8x16_t __ret; \ 3981 poly8x16_t __s0 = __p0; \ 3982 __ret = (poly8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 36); \ 3983 __ret; \ 3984 }) 3985 #else 3986 #define splatq_laneq_p8(__p0, __p1) __extension__ ({ \ 3987 poly8x16_t __ret; \ 3988 poly8x16_t __s0 = __p0; \ 3989 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 3990 __ret = (poly8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 36); \ 3991 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 3992 __ret; \ 3993 }) 3994 #define __noswap_splatq_laneq_p8(__p0, __p1) __extension__ ({ \ 3995 poly8x16_t __ret; \ 3996 poly8x16_t __s0 = __p0; \ 3997 __ret = (poly8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 36); \ 3998 __ret; \ 3999 }) 4000 #endif 4001 4002 #ifdef __LITTLE_ENDIAN__ 4003 #define splatq_laneq_p64(__p0, __p1) __extension__ ({ \ 4004 poly64x2_t __ret; \ 4005 poly64x2_t __s0 = __p0; \ 4006 __ret = (poly64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 38); \ 4007 __ret; \ 4008 }) 4009 #else 4010 #define splatq_laneq_p64(__p0, __p1) __extension__ ({ \ 4011 poly64x2_t __ret; \ 4012 poly64x2_t __s0 = __p0; \ 4013 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 4014 __ret = (poly64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 38); \ 4015 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 4016 __ret; \ 4017 }) 4018 #define __noswap_splatq_laneq_p64(__p0, __p1) __extension__ ({ \ 
4019 poly64x2_t __ret; \ 4020 poly64x2_t __s0 = __p0; \ 4021 __ret = (poly64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 38); \ 4022 __ret; \ 4023 }) 4024 #endif 4025 4026 #ifdef __LITTLE_ENDIAN__ 4027 #define splatq_laneq_p16(__p0, __p1) __extension__ ({ \ 4028 poly16x8_t __ret; \ 4029 poly16x8_t __s0 = __p0; \ 4030 __ret = (poly16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 37); \ 4031 __ret; \ 4032 }) 4033 #else 4034 #define splatq_laneq_p16(__p0, __p1) __extension__ ({ \ 4035 poly16x8_t __ret; \ 4036 poly16x8_t __s0 = __p0; \ 4037 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 4038 __ret = (poly16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 37); \ 4039 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 4040 __ret; \ 4041 }) 4042 #define __noswap_splatq_laneq_p16(__p0, __p1) __extension__ ({ \ 4043 poly16x8_t __ret; \ 4044 poly16x8_t __s0 = __p0; \ 4045 __ret = (poly16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 37); \ 4046 __ret; \ 4047 }) 4048 #endif 4049 4050 #ifdef __LITTLE_ENDIAN__ 4051 #define splatq_laneq_u8(__p0, __p1) __extension__ ({ \ 4052 uint8x16_t __ret; \ 4053 uint8x16_t __s0 = __p0; \ 4054 __ret = (uint8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 48); \ 4055 __ret; \ 4056 }) 4057 #else 4058 #define splatq_laneq_u8(__p0, __p1) __extension__ ({ \ 4059 uint8x16_t __ret; \ 4060 uint8x16_t __s0 = __p0; \ 4061 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 4062 __ret = (uint8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 48); \ 4063 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 4064 __ret; \ 4065 }) 4066 #define __noswap_splatq_laneq_u8(__p0, __p1) __extension__ ({ \ 4067 uint8x16_t __ret; \ 4068 uint8x16_t __s0 = __p0; \ 4069 __ret = (uint8x16_t) 
__builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 48); \ 4070 __ret; \ 4071 }) 4072 #endif 4073 4074 #ifdef __LITTLE_ENDIAN__ 4075 #define splatq_laneq_u32(__p0, __p1) __extension__ ({ \ 4076 uint32x4_t __ret; \ 4077 uint32x4_t __s0 = __p0; \ 4078 __ret = (uint32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 50); \ 4079 __ret; \ 4080 }) 4081 #else 4082 #define splatq_laneq_u32(__p0, __p1) __extension__ ({ \ 4083 uint32x4_t __ret; \ 4084 uint32x4_t __s0 = __p0; \ 4085 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 4086 __ret = (uint32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 50); \ 4087 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 4088 __ret; \ 4089 }) 4090 #define __noswap_splatq_laneq_u32(__p0, __p1) __extension__ ({ \ 4091 uint32x4_t __ret; \ 4092 uint32x4_t __s0 = __p0; \ 4093 __ret = (uint32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 50); \ 4094 __ret; \ 4095 }) 4096 #endif 4097 4098 #ifdef __LITTLE_ENDIAN__ 4099 #define splatq_laneq_u64(__p0, __p1) __extension__ ({ \ 4100 uint64x2_t __ret; \ 4101 uint64x2_t __s0 = __p0; \ 4102 __ret = (uint64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 51); \ 4103 __ret; \ 4104 }) 4105 #else 4106 #define splatq_laneq_u64(__p0, __p1) __extension__ ({ \ 4107 uint64x2_t __ret; \ 4108 uint64x2_t __s0 = __p0; \ 4109 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 4110 __ret = (uint64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 51); \ 4111 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 4112 __ret; \ 4113 }) 4114 #define __noswap_splatq_laneq_u64(__p0, __p1) __extension__ ({ \ 4115 uint64x2_t __ret; \ 4116 uint64x2_t __s0 = __p0; \ 4117 __ret = (uint64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 51); \ 4118 __ret; \ 4119 }) 4120 #endif 4121 4122 #ifdef __LITTLE_ENDIAN__ 4123 #define splatq_laneq_u16(__p0, __p1) __extension__ ({ \ 4124 uint16x8_t __ret; \ 4125 
uint16x8_t __s0 = __p0; \ 4126 __ret = (uint16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 49); \ 4127 __ret; \ 4128 }) 4129 #else 4130 #define splatq_laneq_u16(__p0, __p1) __extension__ ({ \ 4131 uint16x8_t __ret; \ 4132 uint16x8_t __s0 = __p0; \ 4133 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 4134 __ret = (uint16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 49); \ 4135 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 4136 __ret; \ 4137 }) 4138 #define __noswap_splatq_laneq_u16(__p0, __p1) __extension__ ({ \ 4139 uint16x8_t __ret; \ 4140 uint16x8_t __s0 = __p0; \ 4141 __ret = (uint16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 49); \ 4142 __ret; \ 4143 }) 4144 #endif 4145 4146 #ifdef __LITTLE_ENDIAN__ 4147 #define splatq_laneq_s8(__p0, __p1) __extension__ ({ \ 4148 int8x16_t __ret; \ 4149 int8x16_t __s0 = __p0; \ 4150 __ret = (int8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 32); \ 4151 __ret; \ 4152 }) 4153 #else 4154 #define splatq_laneq_s8(__p0, __p1) __extension__ ({ \ 4155 int8x16_t __ret; \ 4156 int8x16_t __s0 = __p0; \ 4157 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 4158 __ret = (int8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 32); \ 4159 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 4160 __ret; \ 4161 }) 4162 #define __noswap_splatq_laneq_s8(__p0, __p1) __extension__ ({ \ 4163 int8x16_t __ret; \ 4164 int8x16_t __s0 = __p0; \ 4165 __ret = (int8x16_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 32); \ 4166 __ret; \ 4167 }) 4168 #endif 4169 4170 #ifdef __LITTLE_ENDIAN__ 4171 #define splatq_laneq_f64(__p0, __p1) __extension__ ({ \ 4172 float64x2_t __ret; \ 4173 float64x2_t __s0 = __p0; \ 4174 __ret = (float64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 42); \ 
4175 __ret; \ 4176 }) 4177 #else 4178 #define splatq_laneq_f64(__p0, __p1) __extension__ ({ \ 4179 float64x2_t __ret; \ 4180 float64x2_t __s0 = __p0; \ 4181 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 4182 __ret = (float64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 42); \ 4183 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 4184 __ret; \ 4185 }) 4186 #define __noswap_splatq_laneq_f64(__p0, __p1) __extension__ ({ \ 4187 float64x2_t __ret; \ 4188 float64x2_t __s0 = __p0; \ 4189 __ret = (float64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 42); \ 4190 __ret; \ 4191 }) 4192 #endif 4193 4194 #ifdef __LITTLE_ENDIAN__ 4195 #define splatq_laneq_f32(__p0, __p1) __extension__ ({ \ 4196 float32x4_t __ret; \ 4197 float32x4_t __s0 = __p0; \ 4198 __ret = (float32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 41); \ 4199 __ret; \ 4200 }) 4201 #else 4202 #define splatq_laneq_f32(__p0, __p1) __extension__ ({ \ 4203 float32x4_t __ret; \ 4204 float32x4_t __s0 = __p0; \ 4205 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 4206 __ret = (float32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 41); \ 4207 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 4208 __ret; \ 4209 }) 4210 #define __noswap_splatq_laneq_f32(__p0, __p1) __extension__ ({ \ 4211 float32x4_t __ret; \ 4212 float32x4_t __s0 = __p0; \ 4213 __ret = (float32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 41); \ 4214 __ret; \ 4215 }) 4216 #endif 4217 4218 #ifdef __LITTLE_ENDIAN__ 4219 #define splatq_laneq_f16(__p0, __p1) __extension__ ({ \ 4220 float16x8_t __ret; \ 4221 float16x8_t __s0 = __p0; \ 4222 __ret = (float16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 40); \ 4223 __ret; \ 4224 }) 4225 #else 4226 #define splatq_laneq_f16(__p0, __p1) __extension__ ({ \ 4227 float16x8_t __ret; \ 4228 float16x8_t __s0 = __p0; \ 4229 float16x8_t __rev0; __rev0 = 
__builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 4230 __ret = (float16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 40); \ 4231 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 4232 __ret; \ 4233 }) 4234 #define __noswap_splatq_laneq_f16(__p0, __p1) __extension__ ({ \ 4235 float16x8_t __ret; \ 4236 float16x8_t __s0 = __p0; \ 4237 __ret = (float16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 40); \ 4238 __ret; \ 4239 }) 4240 #endif 4241 4242 #ifdef __LITTLE_ENDIAN__ 4243 #define splatq_laneq_s32(__p0, __p1) __extension__ ({ \ 4244 int32x4_t __ret; \ 4245 int32x4_t __s0 = __p0; \ 4246 __ret = (int32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 34); \ 4247 __ret; \ 4248 }) 4249 #else 4250 #define splatq_laneq_s32(__p0, __p1) __extension__ ({ \ 4251 int32x4_t __ret; \ 4252 int32x4_t __s0 = __p0; \ 4253 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 4254 __ret = (int32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 34); \ 4255 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 4256 __ret; \ 4257 }) 4258 #define __noswap_splatq_laneq_s32(__p0, __p1) __extension__ ({ \ 4259 int32x4_t __ret; \ 4260 int32x4_t __s0 = __p0; \ 4261 __ret = (int32x4_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 34); \ 4262 __ret; \ 4263 }) 4264 #endif 4265 4266 #ifdef __LITTLE_ENDIAN__ 4267 #define splatq_laneq_s64(__p0, __p1) __extension__ ({ \ 4268 int64x2_t __ret; \ 4269 int64x2_t __s0 = __p0; \ 4270 __ret = (int64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 35); \ 4271 __ret; \ 4272 }) 4273 #else 4274 #define splatq_laneq_s64(__p0, __p1) __extension__ ({ \ 4275 int64x2_t __ret; \ 4276 int64x2_t __s0 = __p0; \ 4277 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 4278 __ret = (int64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 35); \ 4279 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 4280 
__ret; \ 4281 }) 4282 #define __noswap_splatq_laneq_s64(__p0, __p1) __extension__ ({ \ 4283 int64x2_t __ret; \ 4284 int64x2_t __s0 = __p0; \ 4285 __ret = (int64x2_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 35); \ 4286 __ret; \ 4287 }) 4288 #endif 4289 4290 #ifdef __LITTLE_ENDIAN__ 4291 #define splatq_laneq_s16(__p0, __p1) __extension__ ({ \ 4292 int16x8_t __ret; \ 4293 int16x8_t __s0 = __p0; \ 4294 __ret = (int16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 33); \ 4295 __ret; \ 4296 }) 4297 #else 4298 #define splatq_laneq_s16(__p0, __p1) __extension__ ({ \ 4299 int16x8_t __ret; \ 4300 int16x8_t __s0 = __p0; \ 4301 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 4302 __ret = (int16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__rev0, __p1, 33); \ 4303 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 4304 __ret; \ 4305 }) 4306 #define __noswap_splatq_laneq_s16(__p0, __p1) __extension__ ({ \ 4307 int16x8_t __ret; \ 4308 int16x8_t __s0 = __p0; \ 4309 __ret = (int16x8_t) __builtin_neon_splatq_laneq_v((int8x16_t)__s0, __p1, 33); \ 4310 __ret; \ 4311 }) 4312 #endif 4313 4314 #ifdef __LITTLE_ENDIAN__ 4315 #define splat_laneq_u8(__p0, __p1) __extension__ ({ \ 4316 uint8x8_t __ret; \ 4317 uint8x16_t __s0 = __p0; \ 4318 __ret = (uint8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 48); \ 4319 __ret; \ 4320 }) 4321 #else 4322 #define splat_laneq_u8(__p0, __p1) __extension__ ({ \ 4323 uint8x8_t __ret; \ 4324 uint8x16_t __s0 = __p0; \ 4325 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 4326 __ret = (uint8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 48); \ 4327 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 4328 __ret; \ 4329 }) 4330 #define __noswap_splat_laneq_u8(__p0, __p1) __extension__ ({ \ 4331 uint8x8_t __ret; \ 4332 uint8x16_t __s0 = __p0; \ 4333 __ret = 
(uint8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 48); \ 4334 __ret; \ 4335 }) 4336 #endif 4337 4338 #ifdef __LITTLE_ENDIAN__ 4339 #define splat_laneq_u32(__p0, __p1) __extension__ ({ \ 4340 uint32x2_t __ret; \ 4341 uint32x4_t __s0 = __p0; \ 4342 __ret = (uint32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 50); \ 4343 __ret; \ 4344 }) 4345 #else 4346 #define splat_laneq_u32(__p0, __p1) __extension__ ({ \ 4347 uint32x2_t __ret; \ 4348 uint32x4_t __s0 = __p0; \ 4349 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 4350 __ret = (uint32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 50); \ 4351 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 4352 __ret; \ 4353 }) 4354 #define __noswap_splat_laneq_u32(__p0, __p1) __extension__ ({ \ 4355 uint32x2_t __ret; \ 4356 uint32x4_t __s0 = __p0; \ 4357 __ret = (uint32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 50); \ 4358 __ret; \ 4359 }) 4360 #endif 4361 4362 #ifdef __LITTLE_ENDIAN__ 4363 #define splat_laneq_u64(__p0, __p1) __extension__ ({ \ 4364 uint64x1_t __ret; \ 4365 uint64x2_t __s0 = __p0; \ 4366 __ret = (uint64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 51); \ 4367 __ret; \ 4368 }) 4369 #else 4370 #define splat_laneq_u64(__p0, __p1) __extension__ ({ \ 4371 uint64x1_t __ret; \ 4372 uint64x2_t __s0 = __p0; \ 4373 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 4374 __ret = (uint64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 51); \ 4375 __ret; \ 4376 }) 4377 #define __noswap_splat_laneq_u64(__p0, __p1) __extension__ ({ \ 4378 uint64x1_t __ret; \ 4379 uint64x2_t __s0 = __p0; \ 4380 __ret = (uint64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 51); \ 4381 __ret; \ 4382 }) 4383 #endif 4384 4385 #ifdef __LITTLE_ENDIAN__ 4386 #define splat_laneq_u16(__p0, __p1) __extension__ ({ \ 4387 uint16x4_t __ret; \ 4388 uint16x8_t __s0 = __p0; \ 4389 __ret = (uint16x4_t) 
__builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 49); \ 4390 __ret; \ 4391 }) 4392 #else 4393 #define splat_laneq_u16(__p0, __p1) __extension__ ({ \ 4394 uint16x4_t __ret; \ 4395 uint16x8_t __s0 = __p0; \ 4396 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 4397 __ret = (uint16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 49); \ 4398 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 4399 __ret; \ 4400 }) 4401 #define __noswap_splat_laneq_u16(__p0, __p1) __extension__ ({ \ 4402 uint16x4_t __ret; \ 4403 uint16x8_t __s0 = __p0; \ 4404 __ret = (uint16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 49); \ 4405 __ret; \ 4406 }) 4407 #endif 4408 4409 #ifdef __LITTLE_ENDIAN__ 4410 #define splat_laneq_s8(__p0, __p1) __extension__ ({ \ 4411 int8x8_t __ret; \ 4412 int8x16_t __s0 = __p0; \ 4413 __ret = (int8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 32); \ 4414 __ret; \ 4415 }) 4416 #else 4417 #define splat_laneq_s8(__p0, __p1) __extension__ ({ \ 4418 int8x8_t __ret; \ 4419 int8x16_t __s0 = __p0; \ 4420 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 4421 __ret = (int8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 32); \ 4422 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 4423 __ret; \ 4424 }) 4425 #define __noswap_splat_laneq_s8(__p0, __p1) __extension__ ({ \ 4426 int8x8_t __ret; \ 4427 int8x16_t __s0 = __p0; \ 4428 __ret = (int8x8_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 32); \ 4429 __ret; \ 4430 }) 4431 #endif 4432 4433 #ifdef __LITTLE_ENDIAN__ 4434 #define splat_laneq_f64(__p0, __p1) __extension__ ({ \ 4435 float64x1_t __ret; \ 4436 float64x2_t __s0 = __p0; \ 4437 __ret = (float64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 42); \ 4438 __ret; \ 4439 }) 4440 #else 4441 #define splat_laneq_f64(__p0, __p1) __extension__ ({ \ 4442 float64x1_t 
__ret; \ 4443 float64x2_t __s0 = __p0; \ 4444 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 4445 __ret = (float64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 42); \ 4446 __ret; \ 4447 }) 4448 #define __noswap_splat_laneq_f64(__p0, __p1) __extension__ ({ \ 4449 float64x1_t __ret; \ 4450 float64x2_t __s0 = __p0; \ 4451 __ret = (float64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 42); \ 4452 __ret; \ 4453 }) 4454 #endif 4455 4456 #ifdef __LITTLE_ENDIAN__ 4457 #define splat_laneq_f32(__p0, __p1) __extension__ ({ \ 4458 float32x2_t __ret; \ 4459 float32x4_t __s0 = __p0; \ 4460 __ret = (float32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 41); \ 4461 __ret; \ 4462 }) 4463 #else 4464 #define splat_laneq_f32(__p0, __p1) __extension__ ({ \ 4465 float32x2_t __ret; \ 4466 float32x4_t __s0 = __p0; \ 4467 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 4468 __ret = (float32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 41); \ 4469 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 4470 __ret; \ 4471 }) 4472 #define __noswap_splat_laneq_f32(__p0, __p1) __extension__ ({ \ 4473 float32x2_t __ret; \ 4474 float32x4_t __s0 = __p0; \ 4475 __ret = (float32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 41); \ 4476 __ret; \ 4477 }) 4478 #endif 4479 4480 #ifdef __LITTLE_ENDIAN__ 4481 #define splat_laneq_f16(__p0, __p1) __extension__ ({ \ 4482 float16x4_t __ret; \ 4483 float16x8_t __s0 = __p0; \ 4484 __ret = (float16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 40); \ 4485 __ret; \ 4486 }) 4487 #else 4488 #define splat_laneq_f16(__p0, __p1) __extension__ ({ \ 4489 float16x4_t __ret; \ 4490 float16x8_t __s0 = __p0; \ 4491 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 4492 __ret = (float16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 40); \ 4493 __ret = __builtin_shufflevector(__ret, __ret, 3, 
2, 1, 0); \ 4494 __ret; \ 4495 }) 4496 #define __noswap_splat_laneq_f16(__p0, __p1) __extension__ ({ \ 4497 float16x4_t __ret; \ 4498 float16x8_t __s0 = __p0; \ 4499 __ret = (float16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 40); \ 4500 __ret; \ 4501 }) 4502 #endif 4503 4504 #ifdef __LITTLE_ENDIAN__ 4505 #define splat_laneq_s32(__p0, __p1) __extension__ ({ \ 4506 int32x2_t __ret; \ 4507 int32x4_t __s0 = __p0; \ 4508 __ret = (int32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 34); \ 4509 __ret; \ 4510 }) 4511 #else 4512 #define splat_laneq_s32(__p0, __p1) __extension__ ({ \ 4513 int32x2_t __ret; \ 4514 int32x4_t __s0 = __p0; \ 4515 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 4516 __ret = (int32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 34); \ 4517 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 4518 __ret; \ 4519 }) 4520 #define __noswap_splat_laneq_s32(__p0, __p1) __extension__ ({ \ 4521 int32x2_t __ret; \ 4522 int32x4_t __s0 = __p0; \ 4523 __ret = (int32x2_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 34); \ 4524 __ret; \ 4525 }) 4526 #endif 4527 4528 #ifdef __LITTLE_ENDIAN__ 4529 #define splat_laneq_s64(__p0, __p1) __extension__ ({ \ 4530 int64x1_t __ret; \ 4531 int64x2_t __s0 = __p0; \ 4532 __ret = (int64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 35); \ 4533 __ret; \ 4534 }) 4535 #else 4536 #define splat_laneq_s64(__p0, __p1) __extension__ ({ \ 4537 int64x1_t __ret; \ 4538 int64x2_t __s0 = __p0; \ 4539 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 4540 __ret = (int64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 35); \ 4541 __ret; \ 4542 }) 4543 #define __noswap_splat_laneq_s64(__p0, __p1) __extension__ ({ \ 4544 int64x1_t __ret; \ 4545 int64x2_t __s0 = __p0; \ 4546 __ret = (int64x1_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 35); \ 4547 __ret; \ 4548 }) 4549 #endif 4550 4551 #ifdef __LITTLE_ENDIAN__ 4552 
#define splat_laneq_s16(__p0, __p1) __extension__ ({ \ 4553 int16x4_t __ret; \ 4554 int16x8_t __s0 = __p0; \ 4555 __ret = (int16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 33); \ 4556 __ret; \ 4557 }) 4558 #else 4559 #define splat_laneq_s16(__p0, __p1) __extension__ ({ \ 4560 int16x4_t __ret; \ 4561 int16x8_t __s0 = __p0; \ 4562 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 4563 __ret = (int16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__rev0, __p1, 33); \ 4564 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 4565 __ret; \ 4566 }) 4567 #define __noswap_splat_laneq_s16(__p0, __p1) __extension__ ({ \ 4568 int16x4_t __ret; \ 4569 int16x8_t __s0 = __p0; \ 4570 __ret = (int16x4_t) __builtin_neon_splat_laneq_v((int8x16_t)__s0, __p1, 33); \ 4571 __ret; \ 4572 }) 4573 #endif 4574 4575 #ifdef __LITTLE_ENDIAN__ 4576 __ai __attribute__((target("neon"))) uint8x16_t vabdq_u8(uint8x16_t __p0, uint8x16_t __p1) { 4577 uint8x16_t __ret; 4578 __ret = (uint8x16_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 4579 return __ret; 4580 } 4581 #else 4582 __ai __attribute__((target("neon"))) uint8x16_t vabdq_u8(uint8x16_t __p0, uint8x16_t __p1) { 4583 uint8x16_t __ret; 4584 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 4585 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 4586 __ret = (uint8x16_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 4587 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 4588 return __ret; 4589 } 4590 __ai __attribute__((target("neon"))) uint8x16_t __noswap_vabdq_u8(uint8x16_t __p0, uint8x16_t __p1) { 4591 uint8x16_t __ret; 4592 __ret = (uint8x16_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 4593 return __ret; 4594 } 4595 #endif 4596 4597 #ifdef 
__LITTLE_ENDIAN__ 4598 __ai __attribute__((target("neon"))) uint32x4_t vabdq_u32(uint32x4_t __p0, uint32x4_t __p1) { 4599 uint32x4_t __ret; 4600 __ret = (uint32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 4601 return __ret; 4602 } 4603 #else 4604 __ai __attribute__((target("neon"))) uint32x4_t vabdq_u32(uint32x4_t __p0, uint32x4_t __p1) { 4605 uint32x4_t __ret; 4606 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 4607 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 4608 __ret = (uint32x4_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 4609 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 4610 return __ret; 4611 } 4612 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vabdq_u32(uint32x4_t __p0, uint32x4_t __p1) { 4613 uint32x4_t __ret; 4614 __ret = (uint32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 4615 return __ret; 4616 } 4617 #endif 4618 4619 #ifdef __LITTLE_ENDIAN__ 4620 __ai __attribute__((target("neon"))) uint16x8_t vabdq_u16(uint16x8_t __p0, uint16x8_t __p1) { 4621 uint16x8_t __ret; 4622 __ret = (uint16x8_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 4623 return __ret; 4624 } 4625 #else 4626 __ai __attribute__((target("neon"))) uint16x8_t vabdq_u16(uint16x8_t __p0, uint16x8_t __p1) { 4627 uint16x8_t __ret; 4628 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 4629 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 4630 __ret = (uint16x8_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 4631 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 4632 return __ret; 4633 } 4634 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vabdq_u16(uint16x8_t __p0, uint16x8_t __p1) { 4635 uint16x8_t __ret; 4636 __ret = (uint16x8_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 4637 
return __ret; 4638 } 4639 #endif 4640 4641 #ifdef __LITTLE_ENDIAN__ 4642 __ai __attribute__((target("neon"))) int8x16_t vabdq_s8(int8x16_t __p0, int8x16_t __p1) { 4643 int8x16_t __ret; 4644 __ret = (int8x16_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 4645 return __ret; 4646 } 4647 #else 4648 __ai __attribute__((target("neon"))) int8x16_t vabdq_s8(int8x16_t __p0, int8x16_t __p1) { 4649 int8x16_t __ret; 4650 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 4651 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 4652 __ret = (int8x16_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 4653 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 4654 return __ret; 4655 } 4656 __ai __attribute__((target("neon"))) int8x16_t __noswap_vabdq_s8(int8x16_t __p0, int8x16_t __p1) { 4657 int8x16_t __ret; 4658 __ret = (int8x16_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 4659 return __ret; 4660 } 4661 #endif 4662 4663 #ifdef __LITTLE_ENDIAN__ 4664 __ai __attribute__((target("neon"))) float32x4_t vabdq_f32(float32x4_t __p0, float32x4_t __p1) { 4665 float32x4_t __ret; 4666 __ret = (float32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 4667 return __ret; 4668 } 4669 #else 4670 __ai __attribute__((target("neon"))) float32x4_t vabdq_f32(float32x4_t __p0, float32x4_t __p1) { 4671 float32x4_t __ret; 4672 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 4673 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 4674 __ret = (float32x4_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 4675 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 4676 return __ret; 4677 } 4678 #endif 4679 4680 #ifdef __LITTLE_ENDIAN__ 4681 __ai __attribute__((target("neon"))) 
int32x4_t vabdq_s32(int32x4_t __p0, int32x4_t __p1) { 4682 int32x4_t __ret; 4683 __ret = (int32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 4684 return __ret; 4685 } 4686 #else 4687 __ai __attribute__((target("neon"))) int32x4_t vabdq_s32(int32x4_t __p0, int32x4_t __p1) { 4688 int32x4_t __ret; 4689 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 4690 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 4691 __ret = (int32x4_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 4692 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 4693 return __ret; 4694 } 4695 __ai __attribute__((target("neon"))) int32x4_t __noswap_vabdq_s32(int32x4_t __p0, int32x4_t __p1) { 4696 int32x4_t __ret; 4697 __ret = (int32x4_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 4698 return __ret; 4699 } 4700 #endif 4701 4702 #ifdef __LITTLE_ENDIAN__ 4703 __ai __attribute__((target("neon"))) int16x8_t vabdq_s16(int16x8_t __p0, int16x8_t __p1) { 4704 int16x8_t __ret; 4705 __ret = (int16x8_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 4706 return __ret; 4707 } 4708 #else 4709 __ai __attribute__((target("neon"))) int16x8_t vabdq_s16(int16x8_t __p0, int16x8_t __p1) { 4710 int16x8_t __ret; 4711 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 4712 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 4713 __ret = (int16x8_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 4714 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 4715 return __ret; 4716 } 4717 __ai __attribute__((target("neon"))) int16x8_t __noswap_vabdq_s16(int16x8_t __p0, int16x8_t __p1) { 4718 int16x8_t __ret; 4719 __ret = (int16x8_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 4720 return __ret; 4721 } 4722 #endif 4723 4724 #ifdef __LITTLE_ENDIAN__ 4725 __ai 
__attribute__((target("neon"))) uint8x8_t vabd_u8(uint8x8_t __p0, uint8x8_t __p1) { 4726 uint8x8_t __ret; 4727 __ret = (uint8x8_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 4728 return __ret; 4729 } 4730 #else 4731 __ai __attribute__((target("neon"))) uint8x8_t vabd_u8(uint8x8_t __p0, uint8x8_t __p1) { 4732 uint8x8_t __ret; 4733 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 4734 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 4735 __ret = (uint8x8_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 4736 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 4737 return __ret; 4738 } 4739 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vabd_u8(uint8x8_t __p0, uint8x8_t __p1) { 4740 uint8x8_t __ret; 4741 __ret = (uint8x8_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 4742 return __ret; 4743 } 4744 #endif 4745 4746 #ifdef __LITTLE_ENDIAN__ 4747 __ai __attribute__((target("neon"))) uint32x2_t vabd_u32(uint32x2_t __p0, uint32x2_t __p1) { 4748 uint32x2_t __ret; 4749 __ret = (uint32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 4750 return __ret; 4751 } 4752 #else 4753 __ai __attribute__((target("neon"))) uint32x2_t vabd_u32(uint32x2_t __p0, uint32x2_t __p1) { 4754 uint32x2_t __ret; 4755 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 4756 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 4757 __ret = (uint32x2_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 4758 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 4759 return __ret; 4760 } 4761 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vabd_u32(uint32x2_t __p0, uint32x2_t __p1) { 4762 uint32x2_t __ret; 4763 __ret = (uint32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 4764 return __ret; 4765 } 4766 #endif 4767 4768 #ifdef __LITTLE_ENDIAN__ 4769 __ai 
__attribute__((target("neon"))) uint16x4_t vabd_u16(uint16x4_t __p0, uint16x4_t __p1) { 4770 uint16x4_t __ret; 4771 __ret = (uint16x4_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 4772 return __ret; 4773 } 4774 #else 4775 __ai __attribute__((target("neon"))) uint16x4_t vabd_u16(uint16x4_t __p0, uint16x4_t __p1) { 4776 uint16x4_t __ret; 4777 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 4778 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 4779 __ret = (uint16x4_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 4780 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 4781 return __ret; 4782 } 4783 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vabd_u16(uint16x4_t __p0, uint16x4_t __p1) { 4784 uint16x4_t __ret; 4785 __ret = (uint16x4_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 4786 return __ret; 4787 } 4788 #endif 4789 4790 #ifdef __LITTLE_ENDIAN__ 4791 __ai __attribute__((target("neon"))) int8x8_t vabd_s8(int8x8_t __p0, int8x8_t __p1) { 4792 int8x8_t __ret; 4793 __ret = (int8x8_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 4794 return __ret; 4795 } 4796 #else 4797 __ai __attribute__((target("neon"))) int8x8_t vabd_s8(int8x8_t __p0, int8x8_t __p1) { 4798 int8x8_t __ret; 4799 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 4800 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 4801 __ret = (int8x8_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 4802 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 4803 return __ret; 4804 } 4805 __ai __attribute__((target("neon"))) int8x8_t __noswap_vabd_s8(int8x8_t __p0, int8x8_t __p1) { 4806 int8x8_t __ret; 4807 __ret = (int8x8_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 4808 return __ret; 4809 } 4810 #endif 4811 4812 #ifdef __LITTLE_ENDIAN__ 4813 __ai 
__attribute__((target("neon"))) float32x2_t vabd_f32(float32x2_t __p0, float32x2_t __p1) { 4814 float32x2_t __ret; 4815 __ret = (float32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 4816 return __ret; 4817 } 4818 #else 4819 __ai __attribute__((target("neon"))) float32x2_t vabd_f32(float32x2_t __p0, float32x2_t __p1) { 4820 float32x2_t __ret; 4821 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 4822 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 4823 __ret = (float32x2_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 4824 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 4825 return __ret; 4826 } 4827 #endif 4828 4829 #ifdef __LITTLE_ENDIAN__ 4830 __ai __attribute__((target("neon"))) int32x2_t vabd_s32(int32x2_t __p0, int32x2_t __p1) { 4831 int32x2_t __ret; 4832 __ret = (int32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 4833 return __ret; 4834 } 4835 #else 4836 __ai __attribute__((target("neon"))) int32x2_t vabd_s32(int32x2_t __p0, int32x2_t __p1) { 4837 int32x2_t __ret; 4838 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 4839 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 4840 __ret = (int32x2_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 4841 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 4842 return __ret; 4843 } 4844 __ai __attribute__((target("neon"))) int32x2_t __noswap_vabd_s32(int32x2_t __p0, int32x2_t __p1) { 4845 int32x2_t __ret; 4846 __ret = (int32x2_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 4847 return __ret; 4848 } 4849 #endif 4850 4851 #ifdef __LITTLE_ENDIAN__ 4852 __ai __attribute__((target("neon"))) int16x4_t vabd_s16(int16x4_t __p0, int16x4_t __p1) { 4853 int16x4_t __ret; 4854 __ret = (int16x4_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 4855 return __ret; 4856 } 4857 #else 4858 __ai __attribute__((target("neon"))) int16x4_t 
vabd_s16(int16x4_t __p0, int16x4_t __p1) { 4859 int16x4_t __ret; 4860 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 4861 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 4862 __ret = (int16x4_t) __builtin_neon_vabd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 4863 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 4864 return __ret; 4865 } 4866 __ai __attribute__((target("neon"))) int16x4_t __noswap_vabd_s16(int16x4_t __p0, int16x4_t __p1) { 4867 int16x4_t __ret; 4868 __ret = (int16x4_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 4869 return __ret; 4870 } 4871 #endif 4872 4873 #ifdef __LITTLE_ENDIAN__ 4874 __ai __attribute__((target("neon"))) int8x16_t vabsq_s8(int8x16_t __p0) { 4875 int8x16_t __ret; 4876 __ret = (int8x16_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 32); 4877 return __ret; 4878 } 4879 #else 4880 __ai __attribute__((target("neon"))) int8x16_t vabsq_s8(int8x16_t __p0) { 4881 int8x16_t __ret; 4882 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 4883 __ret = (int8x16_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 32); 4884 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 4885 return __ret; 4886 } 4887 #endif 4888 4889 #ifdef __LITTLE_ENDIAN__ 4890 __ai __attribute__((target("neon"))) float32x4_t vabsq_f32(float32x4_t __p0) { 4891 float32x4_t __ret; 4892 __ret = (float32x4_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 41); 4893 return __ret; 4894 } 4895 #else 4896 __ai __attribute__((target("neon"))) float32x4_t vabsq_f32(float32x4_t __p0) { 4897 float32x4_t __ret; 4898 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 4899 __ret = (float32x4_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 41); 4900 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 4901 return __ret; 4902 } 4903 #endif 4904 4905 #ifdef __LITTLE_ENDIAN__ 4906 __ai 
__attribute__((target("neon"))) int32x4_t vabsq_s32(int32x4_t __p0) { 4907 int32x4_t __ret; 4908 __ret = (int32x4_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 34); 4909 return __ret; 4910 } 4911 #else 4912 __ai __attribute__((target("neon"))) int32x4_t vabsq_s32(int32x4_t __p0) { 4913 int32x4_t __ret; 4914 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 4915 __ret = (int32x4_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 34); 4916 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 4917 return __ret; 4918 } 4919 #endif 4920 4921 #ifdef __LITTLE_ENDIAN__ 4922 __ai __attribute__((target("neon"))) int16x8_t vabsq_s16(int16x8_t __p0) { 4923 int16x8_t __ret; 4924 __ret = (int16x8_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 33); 4925 return __ret; 4926 } 4927 #else 4928 __ai __attribute__((target("neon"))) int16x8_t vabsq_s16(int16x8_t __p0) { 4929 int16x8_t __ret; 4930 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 4931 __ret = (int16x8_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 33); 4932 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 4933 return __ret; 4934 } 4935 #endif 4936 4937 #ifdef __LITTLE_ENDIAN__ 4938 __ai __attribute__((target("neon"))) int8x8_t vabs_s8(int8x8_t __p0) { 4939 int8x8_t __ret; 4940 __ret = (int8x8_t) __builtin_neon_vabs_v((int8x8_t)__p0, 0); 4941 return __ret; 4942 } 4943 #else 4944 __ai __attribute__((target("neon"))) int8x8_t vabs_s8(int8x8_t __p0) { 4945 int8x8_t __ret; 4946 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 4947 __ret = (int8x8_t) __builtin_neon_vabs_v((int8x8_t)__rev0, 0); 4948 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 4949 return __ret; 4950 } 4951 #endif 4952 4953 #ifdef __LITTLE_ENDIAN__ 4954 __ai __attribute__((target("neon"))) float32x2_t vabs_f32(float32x2_t __p0) { 4955 float32x2_t __ret; 4956 __ret = (float32x2_t) __builtin_neon_vabs_v((int8x8_t)__p0, 9); 
4957 return __ret; 4958 } 4959 #else 4960 __ai __attribute__((target("neon"))) float32x2_t vabs_f32(float32x2_t __p0) { 4961 float32x2_t __ret; 4962 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 4963 __ret = (float32x2_t) __builtin_neon_vabs_v((int8x8_t)__rev0, 9); 4964 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 4965 return __ret; 4966 } 4967 #endif 4968 4969 #ifdef __LITTLE_ENDIAN__ 4970 __ai __attribute__((target("neon"))) int32x2_t vabs_s32(int32x2_t __p0) { 4971 int32x2_t __ret; 4972 __ret = (int32x2_t) __builtin_neon_vabs_v((int8x8_t)__p0, 2); 4973 return __ret; 4974 } 4975 #else 4976 __ai __attribute__((target("neon"))) int32x2_t vabs_s32(int32x2_t __p0) { 4977 int32x2_t __ret; 4978 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 4979 __ret = (int32x2_t) __builtin_neon_vabs_v((int8x8_t)__rev0, 2); 4980 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 4981 return __ret; 4982 } 4983 #endif 4984 4985 #ifdef __LITTLE_ENDIAN__ 4986 __ai __attribute__((target("neon"))) int16x4_t vabs_s16(int16x4_t __p0) { 4987 int16x4_t __ret; 4988 __ret = (int16x4_t) __builtin_neon_vabs_v((int8x8_t)__p0, 1); 4989 return __ret; 4990 } 4991 #else 4992 __ai __attribute__((target("neon"))) int16x4_t vabs_s16(int16x4_t __p0) { 4993 int16x4_t __ret; 4994 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 4995 __ret = (int16x4_t) __builtin_neon_vabs_v((int8x8_t)__rev0, 1); 4996 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 4997 return __ret; 4998 } 4999 #endif 5000 5001 #ifdef __LITTLE_ENDIAN__ 5002 __ai __attribute__((target("neon"))) uint8x16_t vaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 5003 uint8x16_t __ret; 5004 __ret = __p0 + __p1; 5005 return __ret; 5006 } 5007 #else 5008 __ai __attribute__((target("neon"))) uint8x16_t vaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 5009 uint8x16_t __ret; 5010 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 
8, 7, 6, 5, 4, 3, 2, 1, 0); 5011 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5012 __ret = __rev0 + __rev1; 5013 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5014 return __ret; 5015 } 5016 #endif 5017 5018 #ifdef __LITTLE_ENDIAN__ 5019 __ai __attribute__((target("neon"))) uint32x4_t vaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 5020 uint32x4_t __ret; 5021 __ret = __p0 + __p1; 5022 return __ret; 5023 } 5024 #else 5025 __ai __attribute__((target("neon"))) uint32x4_t vaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 5026 uint32x4_t __ret; 5027 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5028 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5029 __ret = __rev0 + __rev1; 5030 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5031 return __ret; 5032 } 5033 #endif 5034 5035 #ifdef __LITTLE_ENDIAN__ 5036 __ai __attribute__((target("neon"))) uint64x2_t vaddq_u64(uint64x2_t __p0, uint64x2_t __p1) { 5037 uint64x2_t __ret; 5038 __ret = __p0 + __p1; 5039 return __ret; 5040 } 5041 #else 5042 __ai __attribute__((target("neon"))) uint64x2_t vaddq_u64(uint64x2_t __p0, uint64x2_t __p1) { 5043 uint64x2_t __ret; 5044 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5045 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5046 __ret = __rev0 + __rev1; 5047 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5048 return __ret; 5049 } 5050 #endif 5051 5052 #ifdef __LITTLE_ENDIAN__ 5053 __ai __attribute__((target("neon"))) uint16x8_t vaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 5054 uint16x8_t __ret; 5055 __ret = __p0 + __p1; 5056 return __ret; 5057 } 5058 #else 5059 __ai __attribute__((target("neon"))) uint16x8_t vaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 5060 uint16x8_t __ret; 5061 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 
6, 5, 4, 3, 2, 1, 0); 5062 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5063 __ret = __rev0 + __rev1; 5064 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5065 return __ret; 5066 } 5067 #endif 5068 5069 #ifdef __LITTLE_ENDIAN__ 5070 __ai __attribute__((target("neon"))) int8x16_t vaddq_s8(int8x16_t __p0, int8x16_t __p1) { 5071 int8x16_t __ret; 5072 __ret = __p0 + __p1; 5073 return __ret; 5074 } 5075 #else 5076 __ai __attribute__((target("neon"))) int8x16_t vaddq_s8(int8x16_t __p0, int8x16_t __p1) { 5077 int8x16_t __ret; 5078 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5079 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5080 __ret = __rev0 + __rev1; 5081 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5082 return __ret; 5083 } 5084 #endif 5085 5086 #ifdef __LITTLE_ENDIAN__ 5087 __ai __attribute__((target("neon"))) float32x4_t vaddq_f32(float32x4_t __p0, float32x4_t __p1) { 5088 float32x4_t __ret; 5089 __ret = __p0 + __p1; 5090 return __ret; 5091 } 5092 #else 5093 __ai __attribute__((target("neon"))) float32x4_t vaddq_f32(float32x4_t __p0, float32x4_t __p1) { 5094 float32x4_t __ret; 5095 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5096 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5097 __ret = __rev0 + __rev1; 5098 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5099 return __ret; 5100 } 5101 #endif 5102 5103 #ifdef __LITTLE_ENDIAN__ 5104 __ai __attribute__((target("neon"))) int32x4_t vaddq_s32(int32x4_t __p0, int32x4_t __p1) { 5105 int32x4_t __ret; 5106 __ret = __p0 + __p1; 5107 return __ret; 5108 } 5109 #else 5110 __ai __attribute__((target("neon"))) int32x4_t vaddq_s32(int32x4_t __p0, int32x4_t __p1) { 5111 int32x4_t __ret; 5112 
int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5113 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5114 __ret = __rev0 + __rev1; 5115 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5116 return __ret; 5117 } 5118 #endif 5119 5120 #ifdef __LITTLE_ENDIAN__ 5121 __ai __attribute__((target("neon"))) int64x2_t vaddq_s64(int64x2_t __p0, int64x2_t __p1) { 5122 int64x2_t __ret; 5123 __ret = __p0 + __p1; 5124 return __ret; 5125 } 5126 #else 5127 __ai __attribute__((target("neon"))) int64x2_t vaddq_s64(int64x2_t __p0, int64x2_t __p1) { 5128 int64x2_t __ret; 5129 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5130 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5131 __ret = __rev0 + __rev1; 5132 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5133 return __ret; 5134 } 5135 #endif 5136 5137 #ifdef __LITTLE_ENDIAN__ 5138 __ai __attribute__((target("neon"))) int16x8_t vaddq_s16(int16x8_t __p0, int16x8_t __p1) { 5139 int16x8_t __ret; 5140 __ret = __p0 + __p1; 5141 return __ret; 5142 } 5143 #else 5144 __ai __attribute__((target("neon"))) int16x8_t vaddq_s16(int16x8_t __p0, int16x8_t __p1) { 5145 int16x8_t __ret; 5146 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5147 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5148 __ret = __rev0 + __rev1; 5149 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5150 return __ret; 5151 } 5152 #endif 5153 5154 #ifdef __LITTLE_ENDIAN__ 5155 __ai __attribute__((target("neon"))) uint8x8_t vadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 5156 uint8x8_t __ret; 5157 __ret = __p0 + __p1; 5158 return __ret; 5159 } 5160 #else 5161 __ai __attribute__((target("neon"))) uint8x8_t vadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 5162 uint8x8_t __ret; 5163 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5164 
uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5165 __ret = __rev0 + __rev1; 5166 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5167 return __ret; 5168 } 5169 #endif 5170 5171 #ifdef __LITTLE_ENDIAN__ 5172 __ai __attribute__((target("neon"))) uint32x2_t vadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 5173 uint32x2_t __ret; 5174 __ret = __p0 + __p1; 5175 return __ret; 5176 } 5177 #else 5178 __ai __attribute__((target("neon"))) uint32x2_t vadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 5179 uint32x2_t __ret; 5180 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5181 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5182 __ret = __rev0 + __rev1; 5183 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5184 return __ret; 5185 } 5186 #endif 5187 5188 __ai __attribute__((target("neon"))) uint64x1_t vadd_u64(uint64x1_t __p0, uint64x1_t __p1) { 5189 uint64x1_t __ret; 5190 __ret = __p0 + __p1; 5191 return __ret; 5192 } 5193 #ifdef __LITTLE_ENDIAN__ 5194 __ai __attribute__((target("neon"))) uint16x4_t vadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 5195 uint16x4_t __ret; 5196 __ret = __p0 + __p1; 5197 return __ret; 5198 } 5199 #else 5200 __ai __attribute__((target("neon"))) uint16x4_t vadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 5201 uint16x4_t __ret; 5202 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5203 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5204 __ret = __rev0 + __rev1; 5205 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5206 return __ret; 5207 } 5208 #endif 5209 5210 #ifdef __LITTLE_ENDIAN__ 5211 __ai __attribute__((target("neon"))) int8x8_t vadd_s8(int8x8_t __p0, int8x8_t __p1) { 5212 int8x8_t __ret; 5213 __ret = __p0 + __p1; 5214 return __ret; 5215 } 5216 #else 5217 __ai __attribute__((target("neon"))) int8x8_t vadd_s8(int8x8_t __p0, int8x8_t __p1) { 5218 int8x8_t __ret; 5219 int8x8_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5220 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5221 __ret = __rev0 + __rev1; 5222 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5223 return __ret; 5224 } 5225 #endif 5226 5227 #ifdef __LITTLE_ENDIAN__ 5228 __ai __attribute__((target("neon"))) float32x2_t vadd_f32(float32x2_t __p0, float32x2_t __p1) { 5229 float32x2_t __ret; 5230 __ret = __p0 + __p1; 5231 return __ret; 5232 } 5233 #else 5234 __ai __attribute__((target("neon"))) float32x2_t vadd_f32(float32x2_t __p0, float32x2_t __p1) { 5235 float32x2_t __ret; 5236 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5237 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5238 __ret = __rev0 + __rev1; 5239 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5240 return __ret; 5241 } 5242 #endif 5243 5244 #ifdef __LITTLE_ENDIAN__ 5245 __ai __attribute__((target("neon"))) int32x2_t vadd_s32(int32x2_t __p0, int32x2_t __p1) { 5246 int32x2_t __ret; 5247 __ret = __p0 + __p1; 5248 return __ret; 5249 } 5250 #else 5251 __ai __attribute__((target("neon"))) int32x2_t vadd_s32(int32x2_t __p0, int32x2_t __p1) { 5252 int32x2_t __ret; 5253 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5254 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5255 __ret = __rev0 + __rev1; 5256 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5257 return __ret; 5258 } 5259 #endif 5260 5261 __ai __attribute__((target("neon"))) int64x1_t vadd_s64(int64x1_t __p0, int64x1_t __p1) { 5262 int64x1_t __ret; 5263 __ret = __p0 + __p1; 5264 return __ret; 5265 } 5266 #ifdef __LITTLE_ENDIAN__ 5267 __ai __attribute__((target("neon"))) int16x4_t vadd_s16(int16x4_t __p0, int16x4_t __p1) { 5268 int16x4_t __ret; 5269 __ret = __p0 + __p1; 5270 return __ret; 5271 } 5272 #else 5273 __ai __attribute__((target("neon"))) int16x4_t 
vadd_s16(int16x4_t __p0, int16x4_t __p1) { 5274 int16x4_t __ret; 5275 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5276 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5277 __ret = __rev0 + __rev1; 5278 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5279 return __ret; 5280 } 5281 #endif 5282 5283 #ifdef __LITTLE_ENDIAN__ 5284 __ai __attribute__((target("neon"))) poly8x8_t vadd_p8(poly8x8_t __p0, poly8x8_t __p1) { 5285 poly8x8_t __ret; 5286 __ret = (poly8x8_t) __builtin_neon_vadd_v((int8x8_t)__p0, (int8x8_t)__p1, 4); 5287 return __ret; 5288 } 5289 #else 5290 __ai __attribute__((target("neon"))) poly8x8_t vadd_p8(poly8x8_t __p0, poly8x8_t __p1) { 5291 poly8x8_t __ret; 5292 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5293 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5294 __ret = (poly8x8_t) __builtin_neon_vadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 4); 5295 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5296 return __ret; 5297 } 5298 #endif 5299 5300 __ai __attribute__((target("neon"))) poly64x1_t vadd_p64(poly64x1_t __p0, poly64x1_t __p1) { 5301 poly64x1_t __ret; 5302 __ret = (poly64x1_t) __builtin_neon_vadd_v((int8x8_t)__p0, (int8x8_t)__p1, 6); 5303 return __ret; 5304 } 5305 #ifdef __LITTLE_ENDIAN__ 5306 __ai __attribute__((target("neon"))) poly16x4_t vadd_p16(poly16x4_t __p0, poly16x4_t __p1) { 5307 poly16x4_t __ret; 5308 __ret = (poly16x4_t) __builtin_neon_vadd_v((int8x8_t)__p0, (int8x8_t)__p1, 5); 5309 return __ret; 5310 } 5311 #else 5312 __ai __attribute__((target("neon"))) poly16x4_t vadd_p16(poly16x4_t __p0, poly16x4_t __p1) { 5313 poly16x4_t __ret; 5314 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5315 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5316 __ret = (poly16x4_t) __builtin_neon_vadd_v((int8x8_t)__rev0, 
(int8x8_t)__rev1, 5); 5317 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5318 return __ret; 5319 } 5320 #endif 5321 5322 #ifdef __LITTLE_ENDIAN__ 5323 __ai __attribute__((target("neon"))) poly8x16_t vaddq_p8(poly8x16_t __p0, poly8x16_t __p1) { 5324 poly8x16_t __ret; 5325 __ret = (poly8x16_t) __builtin_neon_vaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 36); 5326 return __ret; 5327 } 5328 #else 5329 __ai __attribute__((target("neon"))) poly8x16_t vaddq_p8(poly8x16_t __p0, poly8x16_t __p1) { 5330 poly8x16_t __ret; 5331 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5332 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5333 __ret = (poly8x16_t) __builtin_neon_vaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 36); 5334 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5335 return __ret; 5336 } 5337 #endif 5338 5339 #ifdef __LITTLE_ENDIAN__ 5340 __ai __attribute__((target("neon"))) poly64x2_t vaddq_p64(poly64x2_t __p0, poly64x2_t __p1) { 5341 poly64x2_t __ret; 5342 __ret = (poly64x2_t) __builtin_neon_vaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 38); 5343 return __ret; 5344 } 5345 #else 5346 __ai __attribute__((target("neon"))) poly64x2_t vaddq_p64(poly64x2_t __p0, poly64x2_t __p1) { 5347 poly64x2_t __ret; 5348 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5349 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5350 __ret = (poly64x2_t) __builtin_neon_vaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 38); 5351 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5352 return __ret; 5353 } 5354 #endif 5355 5356 #ifdef __LITTLE_ENDIAN__ 5357 __ai __attribute__((target("neon"))) poly16x8_t vaddq_p16(poly16x8_t __p0, poly16x8_t __p1) { 5358 poly16x8_t __ret; 5359 __ret = (poly16x8_t) __builtin_neon_vaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 37); 
5360 return __ret; 5361 } 5362 #else 5363 __ai __attribute__((target("neon"))) poly16x8_t vaddq_p16(poly16x8_t __p0, poly16x8_t __p1) { 5364 poly16x8_t __ret; 5365 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5366 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5367 __ret = (poly16x8_t) __builtin_neon_vaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 37); 5368 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5369 return __ret; 5370 } 5371 #endif 5372 5373 #ifdef __LITTLE_ENDIAN__ 5374 __ai __attribute__((target("neon"))) uint16x4_t vaddhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 5375 uint16x4_t __ret; 5376 __ret = (uint16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17); 5377 return __ret; 5378 } 5379 #else 5380 __ai __attribute__((target("neon"))) uint16x4_t vaddhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 5381 uint16x4_t __ret; 5382 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5383 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5384 __ret = (uint16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 17); 5385 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5386 return __ret; 5387 } 5388 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vaddhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 5389 uint16x4_t __ret; 5390 __ret = (uint16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17); 5391 return __ret; 5392 } 5393 #endif 5394 5395 #ifdef __LITTLE_ENDIAN__ 5396 __ai __attribute__((target("neon"))) uint32x2_t vaddhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 5397 uint32x2_t __ret; 5398 __ret = (uint32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18); 5399 return __ret; 5400 } 5401 #else 5402 __ai __attribute__((target("neon"))) uint32x2_t vaddhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 5403 uint32x2_t __ret; 5404 uint64x2_t __rev0; 
__rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5405 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5406 __ret = (uint32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 18); 5407 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5408 return __ret; 5409 } 5410 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vaddhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 5411 uint32x2_t __ret; 5412 __ret = (uint32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18); 5413 return __ret; 5414 } 5415 #endif 5416 5417 #ifdef __LITTLE_ENDIAN__ 5418 __ai __attribute__((target("neon"))) uint8x8_t vaddhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 5419 uint8x8_t __ret; 5420 __ret = (uint8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16); 5421 return __ret; 5422 } 5423 #else 5424 __ai __attribute__((target("neon"))) uint8x8_t vaddhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 5425 uint8x8_t __ret; 5426 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5427 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5428 __ret = (uint8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 16); 5429 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5430 return __ret; 5431 } 5432 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vaddhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 5433 uint8x8_t __ret; 5434 __ret = (uint8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16); 5435 return __ret; 5436 } 5437 #endif 5438 5439 #ifdef __LITTLE_ENDIAN__ 5440 __ai __attribute__((target("neon"))) int16x4_t vaddhn_s32(int32x4_t __p0, int32x4_t __p1) { 5441 int16x4_t __ret; 5442 __ret = (int16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1); 5443 return __ret; 5444 } 5445 #else 5446 __ai __attribute__((target("neon"))) int16x4_t vaddhn_s32(int32x4_t __p0, int32x4_t __p1) { 5447 int16x4_t 
__ret; 5448 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5449 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5450 __ret = (int16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 1); 5451 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5452 return __ret; 5453 } 5454 __ai __attribute__((target("neon"))) int16x4_t __noswap_vaddhn_s32(int32x4_t __p0, int32x4_t __p1) { 5455 int16x4_t __ret; 5456 __ret = (int16x4_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1); 5457 return __ret; 5458 } 5459 #endif 5460 5461 #ifdef __LITTLE_ENDIAN__ 5462 __ai __attribute__((target("neon"))) int32x2_t vaddhn_s64(int64x2_t __p0, int64x2_t __p1) { 5463 int32x2_t __ret; 5464 __ret = (int32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2); 5465 return __ret; 5466 } 5467 #else 5468 __ai __attribute__((target("neon"))) int32x2_t vaddhn_s64(int64x2_t __p0, int64x2_t __p1) { 5469 int32x2_t __ret; 5470 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5471 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5472 __ret = (int32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 2); 5473 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5474 return __ret; 5475 } 5476 __ai __attribute__((target("neon"))) int32x2_t __noswap_vaddhn_s64(int64x2_t __p0, int64x2_t __p1) { 5477 int32x2_t __ret; 5478 __ret = (int32x2_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2); 5479 return __ret; 5480 } 5481 #endif 5482 5483 #ifdef __LITTLE_ENDIAN__ 5484 __ai __attribute__((target("neon"))) int8x8_t vaddhn_s16(int16x8_t __p0, int16x8_t __p1) { 5485 int8x8_t __ret; 5486 __ret = (int8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0); 5487 return __ret; 5488 } 5489 #else 5490 __ai __attribute__((target("neon"))) int8x8_t vaddhn_s16(int16x8_t __p0, int16x8_t __p1) { 5491 int8x8_t __ret; 5492 int16x8_t __rev0; __rev0 
= __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5493 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5494 __ret = (int8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 0); 5495 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5496 return __ret; 5497 } 5498 __ai __attribute__((target("neon"))) int8x8_t __noswap_vaddhn_s16(int16x8_t __p0, int16x8_t __p1) { 5499 int8x8_t __ret; 5500 __ret = (int8x8_t) __builtin_neon_vaddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0); 5501 return __ret; 5502 } 5503 #endif 5504 5505 #ifdef __LITTLE_ENDIAN__ 5506 __ai __attribute__((target("neon"))) uint8x16_t vandq_u8(uint8x16_t __p0, uint8x16_t __p1) { 5507 uint8x16_t __ret; 5508 __ret = __p0 & __p1; 5509 return __ret; 5510 } 5511 #else 5512 __ai __attribute__((target("neon"))) uint8x16_t vandq_u8(uint8x16_t __p0, uint8x16_t __p1) { 5513 uint8x16_t __ret; 5514 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5515 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5516 __ret = __rev0 & __rev1; 5517 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5518 return __ret; 5519 } 5520 #endif 5521 5522 #ifdef __LITTLE_ENDIAN__ 5523 __ai __attribute__((target("neon"))) uint32x4_t vandq_u32(uint32x4_t __p0, uint32x4_t __p1) { 5524 uint32x4_t __ret; 5525 __ret = __p0 & __p1; 5526 return __ret; 5527 } 5528 #else 5529 __ai __attribute__((target("neon"))) uint32x4_t vandq_u32(uint32x4_t __p0, uint32x4_t __p1) { 5530 uint32x4_t __ret; 5531 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5532 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5533 __ret = __rev0 & __rev1; 5534 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5535 return __ret; 5536 } 5537 #endif 
5538 5539 #ifdef __LITTLE_ENDIAN__ 5540 __ai __attribute__((target("neon"))) uint64x2_t vandq_u64(uint64x2_t __p0, uint64x2_t __p1) { 5541 uint64x2_t __ret; 5542 __ret = __p0 & __p1; 5543 return __ret; 5544 } 5545 #else 5546 __ai __attribute__((target("neon"))) uint64x2_t vandq_u64(uint64x2_t __p0, uint64x2_t __p1) { 5547 uint64x2_t __ret; 5548 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5549 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5550 __ret = __rev0 & __rev1; 5551 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5552 return __ret; 5553 } 5554 #endif 5555 5556 #ifdef __LITTLE_ENDIAN__ 5557 __ai __attribute__((target("neon"))) uint16x8_t vandq_u16(uint16x8_t __p0, uint16x8_t __p1) { 5558 uint16x8_t __ret; 5559 __ret = __p0 & __p1; 5560 return __ret; 5561 } 5562 #else 5563 __ai __attribute__((target("neon"))) uint16x8_t vandq_u16(uint16x8_t __p0, uint16x8_t __p1) { 5564 uint16x8_t __ret; 5565 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5566 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5567 __ret = __rev0 & __rev1; 5568 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5569 return __ret; 5570 } 5571 #endif 5572 5573 #ifdef __LITTLE_ENDIAN__ 5574 __ai __attribute__((target("neon"))) int8x16_t vandq_s8(int8x16_t __p0, int8x16_t __p1) { 5575 int8x16_t __ret; 5576 __ret = __p0 & __p1; 5577 return __ret; 5578 } 5579 #else 5580 __ai __attribute__((target("neon"))) int8x16_t vandq_s8(int8x16_t __p0, int8x16_t __p1) { 5581 int8x16_t __ret; 5582 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5583 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5584 __ret = __rev0 & __rev1; 5585 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 
2, 1, 0); 5586 return __ret; 5587 } 5588 #endif 5589 5590 #ifdef __LITTLE_ENDIAN__ 5591 __ai __attribute__((target("neon"))) int32x4_t vandq_s32(int32x4_t __p0, int32x4_t __p1) { 5592 int32x4_t __ret; 5593 __ret = __p0 & __p1; 5594 return __ret; 5595 } 5596 #else 5597 __ai __attribute__((target("neon"))) int32x4_t vandq_s32(int32x4_t __p0, int32x4_t __p1) { 5598 int32x4_t __ret; 5599 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5600 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5601 __ret = __rev0 & __rev1; 5602 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5603 return __ret; 5604 } 5605 #endif 5606 5607 #ifdef __LITTLE_ENDIAN__ 5608 __ai __attribute__((target("neon"))) int64x2_t vandq_s64(int64x2_t __p0, int64x2_t __p1) { 5609 int64x2_t __ret; 5610 __ret = __p0 & __p1; 5611 return __ret; 5612 } 5613 #else 5614 __ai __attribute__((target("neon"))) int64x2_t vandq_s64(int64x2_t __p0, int64x2_t __p1) { 5615 int64x2_t __ret; 5616 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5617 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5618 __ret = __rev0 & __rev1; 5619 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5620 return __ret; 5621 } 5622 #endif 5623 5624 #ifdef __LITTLE_ENDIAN__ 5625 __ai __attribute__((target("neon"))) int16x8_t vandq_s16(int16x8_t __p0, int16x8_t __p1) { 5626 int16x8_t __ret; 5627 __ret = __p0 & __p1; 5628 return __ret; 5629 } 5630 #else 5631 __ai __attribute__((target("neon"))) int16x8_t vandq_s16(int16x8_t __p0, int16x8_t __p1) { 5632 int16x8_t __ret; 5633 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5634 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5635 __ret = __rev0 & __rev1; 5636 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5637 return __ret; 5638 } 5639 #endif 5640 5641 #ifdef __LITTLE_ENDIAN__ 5642 __ai 
__attribute__((target("neon"))) uint8x8_t vand_u8(uint8x8_t __p0, uint8x8_t __p1) { 5643 uint8x8_t __ret; 5644 __ret = __p0 & __p1; 5645 return __ret; 5646 } 5647 #else 5648 __ai __attribute__((target("neon"))) uint8x8_t vand_u8(uint8x8_t __p0, uint8x8_t __p1) { 5649 uint8x8_t __ret; 5650 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5651 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5652 __ret = __rev0 & __rev1; 5653 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5654 return __ret; 5655 } 5656 #endif 5657 5658 #ifdef __LITTLE_ENDIAN__ 5659 __ai __attribute__((target("neon"))) uint32x2_t vand_u32(uint32x2_t __p0, uint32x2_t __p1) { 5660 uint32x2_t __ret; 5661 __ret = __p0 & __p1; 5662 return __ret; 5663 } 5664 #else 5665 __ai __attribute__((target("neon"))) uint32x2_t vand_u32(uint32x2_t __p0, uint32x2_t __p1) { 5666 uint32x2_t __ret; 5667 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5668 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5669 __ret = __rev0 & __rev1; 5670 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5671 return __ret; 5672 } 5673 #endif 5674 5675 __ai __attribute__((target("neon"))) uint64x1_t vand_u64(uint64x1_t __p0, uint64x1_t __p1) { 5676 uint64x1_t __ret; 5677 __ret = __p0 & __p1; 5678 return __ret; 5679 } 5680 #ifdef __LITTLE_ENDIAN__ 5681 __ai __attribute__((target("neon"))) uint16x4_t vand_u16(uint16x4_t __p0, uint16x4_t __p1) { 5682 uint16x4_t __ret; 5683 __ret = __p0 & __p1; 5684 return __ret; 5685 } 5686 #else 5687 __ai __attribute__((target("neon"))) uint16x4_t vand_u16(uint16x4_t __p0, uint16x4_t __p1) { 5688 uint16x4_t __ret; 5689 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5690 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5691 __ret = __rev0 & __rev1; 5692 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 
0); 5693 return __ret; 5694 } 5695 #endif 5696 5697 #ifdef __LITTLE_ENDIAN__ 5698 __ai __attribute__((target("neon"))) int8x8_t vand_s8(int8x8_t __p0, int8x8_t __p1) { 5699 int8x8_t __ret; 5700 __ret = __p0 & __p1; 5701 return __ret; 5702 } 5703 #else 5704 __ai __attribute__((target("neon"))) int8x8_t vand_s8(int8x8_t __p0, int8x8_t __p1) { 5705 int8x8_t __ret; 5706 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5707 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5708 __ret = __rev0 & __rev1; 5709 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5710 return __ret; 5711 } 5712 #endif 5713 5714 #ifdef __LITTLE_ENDIAN__ 5715 __ai __attribute__((target("neon"))) int32x2_t vand_s32(int32x2_t __p0, int32x2_t __p1) { 5716 int32x2_t __ret; 5717 __ret = __p0 & __p1; 5718 return __ret; 5719 } 5720 #else 5721 __ai __attribute__((target("neon"))) int32x2_t vand_s32(int32x2_t __p0, int32x2_t __p1) { 5722 int32x2_t __ret; 5723 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5724 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5725 __ret = __rev0 & __rev1; 5726 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5727 return __ret; 5728 } 5729 #endif 5730 5731 __ai __attribute__((target("neon"))) int64x1_t vand_s64(int64x1_t __p0, int64x1_t __p1) { 5732 int64x1_t __ret; 5733 __ret = __p0 & __p1; 5734 return __ret; 5735 } 5736 #ifdef __LITTLE_ENDIAN__ 5737 __ai __attribute__((target("neon"))) int16x4_t vand_s16(int16x4_t __p0, int16x4_t __p1) { 5738 int16x4_t __ret; 5739 __ret = __p0 & __p1; 5740 return __ret; 5741 } 5742 #else 5743 __ai __attribute__((target("neon"))) int16x4_t vand_s16(int16x4_t __p0, int16x4_t __p1) { 5744 int16x4_t __ret; 5745 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5746 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5747 __ret = __rev0 & __rev1; 5748 
__ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5749 return __ret; 5750 } 5751 #endif 5752 5753 #ifdef __LITTLE_ENDIAN__ 5754 __ai __attribute__((target("neon"))) uint8x16_t vbicq_u8(uint8x16_t __p0, uint8x16_t __p1) { 5755 uint8x16_t __ret; 5756 __ret = __p0 & ~__p1; 5757 return __ret; 5758 } 5759 #else 5760 __ai __attribute__((target("neon"))) uint8x16_t vbicq_u8(uint8x16_t __p0, uint8x16_t __p1) { 5761 uint8x16_t __ret; 5762 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5763 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5764 __ret = __rev0 & ~__rev1; 5765 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5766 return __ret; 5767 } 5768 #endif 5769 5770 #ifdef __LITTLE_ENDIAN__ 5771 __ai __attribute__((target("neon"))) uint32x4_t vbicq_u32(uint32x4_t __p0, uint32x4_t __p1) { 5772 uint32x4_t __ret; 5773 __ret = __p0 & ~__p1; 5774 return __ret; 5775 } 5776 #else 5777 __ai __attribute__((target("neon"))) uint32x4_t vbicq_u32(uint32x4_t __p0, uint32x4_t __p1) { 5778 uint32x4_t __ret; 5779 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5780 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5781 __ret = __rev0 & ~__rev1; 5782 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5783 return __ret; 5784 } 5785 #endif 5786 5787 #ifdef __LITTLE_ENDIAN__ 5788 __ai __attribute__((target("neon"))) uint64x2_t vbicq_u64(uint64x2_t __p0, uint64x2_t __p1) { 5789 uint64x2_t __ret; 5790 __ret = __p0 & ~__p1; 5791 return __ret; 5792 } 5793 #else 5794 __ai __attribute__((target("neon"))) uint64x2_t vbicq_u64(uint64x2_t __p0, uint64x2_t __p1) { 5795 uint64x2_t __ret; 5796 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5797 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 
5798 __ret = __rev0 & ~__rev1; 5799 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5800 return __ret; 5801 } 5802 #endif 5803 5804 #ifdef __LITTLE_ENDIAN__ 5805 __ai __attribute__((target("neon"))) uint16x8_t vbicq_u16(uint16x8_t __p0, uint16x8_t __p1) { 5806 uint16x8_t __ret; 5807 __ret = __p0 & ~__p1; 5808 return __ret; 5809 } 5810 #else 5811 __ai __attribute__((target("neon"))) uint16x8_t vbicq_u16(uint16x8_t __p0, uint16x8_t __p1) { 5812 uint16x8_t __ret; 5813 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5814 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5815 __ret = __rev0 & ~__rev1; 5816 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5817 return __ret; 5818 } 5819 #endif 5820 5821 #ifdef __LITTLE_ENDIAN__ 5822 __ai __attribute__((target("neon"))) int8x16_t vbicq_s8(int8x16_t __p0, int8x16_t __p1) { 5823 int8x16_t __ret; 5824 __ret = __p0 & ~__p1; 5825 return __ret; 5826 } 5827 #else 5828 __ai __attribute__((target("neon"))) int8x16_t vbicq_s8(int8x16_t __p0, int8x16_t __p1) { 5829 int8x16_t __ret; 5830 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5831 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5832 __ret = __rev0 & ~__rev1; 5833 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 5834 return __ret; 5835 } 5836 #endif 5837 5838 #ifdef __LITTLE_ENDIAN__ 5839 __ai __attribute__((target("neon"))) int32x4_t vbicq_s32(int32x4_t __p0, int32x4_t __p1) { 5840 int32x4_t __ret; 5841 __ret = __p0 & ~__p1; 5842 return __ret; 5843 } 5844 #else 5845 __ai __attribute__((target("neon"))) int32x4_t vbicq_s32(int32x4_t __p0, int32x4_t __p1) { 5846 int32x4_t __ret; 5847 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5848 int32x4_t __rev1; 
__rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5849 __ret = __rev0 & ~__rev1; 5850 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5851 return __ret; 5852 } 5853 #endif 5854 5855 #ifdef __LITTLE_ENDIAN__ 5856 __ai __attribute__((target("neon"))) int64x2_t vbicq_s64(int64x2_t __p0, int64x2_t __p1) { 5857 int64x2_t __ret; 5858 __ret = __p0 & ~__p1; 5859 return __ret; 5860 } 5861 #else 5862 __ai __attribute__((target("neon"))) int64x2_t vbicq_s64(int64x2_t __p0, int64x2_t __p1) { 5863 int64x2_t __ret; 5864 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5865 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5866 __ret = __rev0 & ~__rev1; 5867 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5868 return __ret; 5869 } 5870 #endif 5871 5872 #ifdef __LITTLE_ENDIAN__ 5873 __ai __attribute__((target("neon"))) int16x8_t vbicq_s16(int16x8_t __p0, int16x8_t __p1) { 5874 int16x8_t __ret; 5875 __ret = __p0 & ~__p1; 5876 return __ret; 5877 } 5878 #else 5879 __ai __attribute__((target("neon"))) int16x8_t vbicq_s16(int16x8_t __p0, int16x8_t __p1) { 5880 int16x8_t __ret; 5881 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5882 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5883 __ret = __rev0 & ~__rev1; 5884 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5885 return __ret; 5886 } 5887 #endif 5888 5889 #ifdef __LITTLE_ENDIAN__ 5890 __ai __attribute__((target("neon"))) uint8x8_t vbic_u8(uint8x8_t __p0, uint8x8_t __p1) { 5891 uint8x8_t __ret; 5892 __ret = __p0 & ~__p1; 5893 return __ret; 5894 } 5895 #else 5896 __ai __attribute__((target("neon"))) uint8x8_t vbic_u8(uint8x8_t __p0, uint8x8_t __p1) { 5897 uint8x8_t __ret; 5898 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5899 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5900 __ret = 
__rev0 & ~__rev1; 5901 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5902 return __ret; 5903 } 5904 #endif 5905 5906 #ifdef __LITTLE_ENDIAN__ 5907 __ai __attribute__((target("neon"))) uint32x2_t vbic_u32(uint32x2_t __p0, uint32x2_t __p1) { 5908 uint32x2_t __ret; 5909 __ret = __p0 & ~__p1; 5910 return __ret; 5911 } 5912 #else 5913 __ai __attribute__((target("neon"))) uint32x2_t vbic_u32(uint32x2_t __p0, uint32x2_t __p1) { 5914 uint32x2_t __ret; 5915 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5916 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5917 __ret = __rev0 & ~__rev1; 5918 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5919 return __ret; 5920 } 5921 #endif 5922 5923 __ai __attribute__((target("neon"))) uint64x1_t vbic_u64(uint64x1_t __p0, uint64x1_t __p1) { 5924 uint64x1_t __ret; 5925 __ret = __p0 & ~__p1; 5926 return __ret; 5927 } 5928 #ifdef __LITTLE_ENDIAN__ 5929 __ai __attribute__((target("neon"))) uint16x4_t vbic_u16(uint16x4_t __p0, uint16x4_t __p1) { 5930 uint16x4_t __ret; 5931 __ret = __p0 & ~__p1; 5932 return __ret; 5933 } 5934 #else 5935 __ai __attribute__((target("neon"))) uint16x4_t vbic_u16(uint16x4_t __p0, uint16x4_t __p1) { 5936 uint16x4_t __ret; 5937 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5938 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5939 __ret = __rev0 & ~__rev1; 5940 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5941 return __ret; 5942 } 5943 #endif 5944 5945 #ifdef __LITTLE_ENDIAN__ 5946 __ai __attribute__((target("neon"))) int8x8_t vbic_s8(int8x8_t __p0, int8x8_t __p1) { 5947 int8x8_t __ret; 5948 __ret = __p0 & ~__p1; 5949 return __ret; 5950 } 5951 #else 5952 __ai __attribute__((target("neon"))) int8x8_t vbic_s8(int8x8_t __p0, int8x8_t __p1) { 5953 int8x8_t __ret; 5954 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 5955 int8x8_t 
__rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 5956 __ret = __rev0 & ~__rev1; 5957 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 5958 return __ret; 5959 } 5960 #endif 5961 5962 #ifdef __LITTLE_ENDIAN__ 5963 __ai __attribute__((target("neon"))) int32x2_t vbic_s32(int32x2_t __p0, int32x2_t __p1) { 5964 int32x2_t __ret; 5965 __ret = __p0 & ~__p1; 5966 return __ret; 5967 } 5968 #else 5969 __ai __attribute__((target("neon"))) int32x2_t vbic_s32(int32x2_t __p0, int32x2_t __p1) { 5970 int32x2_t __ret; 5971 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 5972 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 5973 __ret = __rev0 & ~__rev1; 5974 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 5975 return __ret; 5976 } 5977 #endif 5978 5979 __ai __attribute__((target("neon"))) int64x1_t vbic_s64(int64x1_t __p0, int64x1_t __p1) { 5980 int64x1_t __ret; 5981 __ret = __p0 & ~__p1; 5982 return __ret; 5983 } 5984 #ifdef __LITTLE_ENDIAN__ 5985 __ai __attribute__((target("neon"))) int16x4_t vbic_s16(int16x4_t __p0, int16x4_t __p1) { 5986 int16x4_t __ret; 5987 __ret = __p0 & ~__p1; 5988 return __ret; 5989 } 5990 #else 5991 __ai __attribute__((target("neon"))) int16x4_t vbic_s16(int16x4_t __p0, int16x4_t __p1) { 5992 int16x4_t __ret; 5993 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 5994 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 5995 __ret = __rev0 & ~__rev1; 5996 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 5997 return __ret; 5998 } 5999 #endif 6000 6001 #ifdef __LITTLE_ENDIAN__ 6002 __ai __attribute__((target("neon"))) poly8x8_t vbsl_p8(uint8x8_t __p0, poly8x8_t __p1, poly8x8_t __p2) { 6003 poly8x8_t __ret; 6004 __ret = (poly8x8_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 4); 6005 return __ret; 6006 } 6007 #else 6008 __ai __attribute__((target("neon"))) poly8x8_t 
vbsl_p8(uint8x8_t __p0, poly8x8_t __p1, poly8x8_t __p2) { 6009 poly8x8_t __ret; 6010 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6011 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6012 poly8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 6013 __ret = (poly8x8_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 4); 6014 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6015 return __ret; 6016 } 6017 #endif 6018 6019 #ifdef __LITTLE_ENDIAN__ 6020 __ai __attribute__((target("neon"))) poly16x4_t vbsl_p16(uint16x4_t __p0, poly16x4_t __p1, poly16x4_t __p2) { 6021 poly16x4_t __ret; 6022 __ret = (poly16x4_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 5); 6023 return __ret; 6024 } 6025 #else 6026 __ai __attribute__((target("neon"))) poly16x4_t vbsl_p16(uint16x4_t __p0, poly16x4_t __p1, poly16x4_t __p2) { 6027 poly16x4_t __ret; 6028 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6029 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6030 poly16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 6031 __ret = (poly16x4_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 5); 6032 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6033 return __ret; 6034 } 6035 #endif 6036 6037 #ifdef __LITTLE_ENDIAN__ 6038 __ai __attribute__((target("neon"))) poly8x16_t vbslq_p8(uint8x16_t __p0, poly8x16_t __p1, poly8x16_t __p2) { 6039 poly8x16_t __ret; 6040 __ret = (poly8x16_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 36); 6041 return __ret; 6042 } 6043 #else 6044 __ai __attribute__((target("neon"))) poly8x16_t vbslq_p8(uint8x16_t __p0, poly8x16_t __p1, poly8x16_t __p2) { 6045 poly8x16_t __ret; 6046 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, 
__p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6047 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6048 poly8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6049 __ret = (poly8x16_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 36); 6050 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6051 return __ret; 6052 } 6053 #endif 6054 6055 #ifdef __LITTLE_ENDIAN__ 6056 __ai __attribute__((target("neon"))) poly16x8_t vbslq_p16(uint16x8_t __p0, poly16x8_t __p1, poly16x8_t __p2) { 6057 poly16x8_t __ret; 6058 __ret = (poly16x8_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 37); 6059 return __ret; 6060 } 6061 #else 6062 __ai __attribute__((target("neon"))) poly16x8_t vbslq_p16(uint16x8_t __p0, poly16x8_t __p1, poly16x8_t __p2) { 6063 poly16x8_t __ret; 6064 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6065 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6066 poly16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 6067 __ret = (poly16x8_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 37); 6068 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6069 return __ret; 6070 } 6071 #endif 6072 6073 #ifdef __LITTLE_ENDIAN__ 6074 __ai __attribute__((target("neon"))) uint8x16_t vbslq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 6075 uint8x16_t __ret; 6076 __ret = (uint8x16_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 48); 6077 return __ret; 6078 } 6079 #else 6080 __ai __attribute__((target("neon"))) uint8x16_t vbslq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 6081 uint8x16_t __ret; 6082 uint8x16_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6083 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6084 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6085 __ret = (uint8x16_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 48); 6086 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6087 return __ret; 6088 } 6089 #endif 6090 6091 #ifdef __LITTLE_ENDIAN__ 6092 __ai __attribute__((target("neon"))) uint32x4_t vbslq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 6093 uint32x4_t __ret; 6094 __ret = (uint32x4_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 6095 return __ret; 6096 } 6097 #else 6098 __ai __attribute__((target("neon"))) uint32x4_t vbslq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 6099 uint32x4_t __ret; 6100 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6101 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6102 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 6103 __ret = (uint32x4_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 6104 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6105 return __ret; 6106 } 6107 #endif 6108 6109 #ifdef __LITTLE_ENDIAN__ 6110 __ai __attribute__((target("neon"))) uint64x2_t vbslq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 6111 uint64x2_t __ret; 6112 __ret = (uint64x2_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51); 6113 return __ret; 6114 } 6115 #else 6116 __ai __attribute__((target("neon"))) uint64x2_t vbslq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 6117 uint64x2_t __ret; 6118 uint64x2_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6119 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6120 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 6121 __ret = (uint64x2_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51); 6122 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6123 return __ret; 6124 } 6125 #endif 6126 6127 #ifdef __LITTLE_ENDIAN__ 6128 __ai __attribute__((target("neon"))) uint16x8_t vbslq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 6129 uint16x8_t __ret; 6130 __ret = (uint16x8_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 49); 6131 return __ret; 6132 } 6133 #else 6134 __ai __attribute__((target("neon"))) uint16x8_t vbslq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 6135 uint16x8_t __ret; 6136 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6137 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6138 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 6139 __ret = (uint16x8_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 49); 6140 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6141 return __ret; 6142 } 6143 #endif 6144 6145 #ifdef __LITTLE_ENDIAN__ 6146 __ai __attribute__((target("neon"))) int8x16_t vbslq_s8(uint8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 6147 int8x16_t __ret; 6148 __ret = (int8x16_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 32); 6149 return __ret; 6150 } 6151 #else 6152 __ai __attribute__((target("neon"))) int8x16_t vbslq_s8(uint8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 6153 int8x16_t __ret; 6154 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6155 int8x16_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6156 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6157 __ret = (int8x16_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 32); 6158 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6159 return __ret; 6160 } 6161 #endif 6162 6163 #ifdef __LITTLE_ENDIAN__ 6164 __ai __attribute__((target("neon"))) float32x4_t vbslq_f32(uint32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 6165 float32x4_t __ret; 6166 __ret = (float32x4_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 6167 return __ret; 6168 } 6169 #else 6170 __ai __attribute__((target("neon"))) float32x4_t vbslq_f32(uint32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 6171 float32x4_t __ret; 6172 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6173 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6174 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 6175 __ret = (float32x4_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 6176 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6177 return __ret; 6178 } 6179 #endif 6180 6181 #ifdef __LITTLE_ENDIAN__ 6182 __ai __attribute__((target("neon"))) int32x4_t vbslq_s32(uint32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 6183 int32x4_t __ret; 6184 __ret = (int32x4_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 6185 return __ret; 6186 } 6187 #else 6188 __ai __attribute__((target("neon"))) int32x4_t vbslq_s32(uint32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 6189 int32x4_t __ret; 6190 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6191 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 
0); 6192 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 6193 __ret = (int32x4_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34); 6194 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6195 return __ret; 6196 } 6197 #endif 6198 6199 #ifdef __LITTLE_ENDIAN__ 6200 __ai __attribute__((target("neon"))) int64x2_t vbslq_s64(uint64x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 6201 int64x2_t __ret; 6202 __ret = (int64x2_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 35); 6203 return __ret; 6204 } 6205 #else 6206 __ai __attribute__((target("neon"))) int64x2_t vbslq_s64(uint64x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 6207 int64x2_t __ret; 6208 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6209 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6210 int64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 6211 __ret = (int64x2_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 35); 6212 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6213 return __ret; 6214 } 6215 #endif 6216 6217 #ifdef __LITTLE_ENDIAN__ 6218 __ai __attribute__((target("neon"))) int16x8_t vbslq_s16(uint16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 6219 int16x8_t __ret; 6220 __ret = (int16x8_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33); 6221 return __ret; 6222 } 6223 #else 6224 __ai __attribute__((target("neon"))) int16x8_t vbslq_s16(uint16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 6225 int16x8_t __ret; 6226 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6227 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6228 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 6229 __ret = (int16x8_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 
(int8x16_t)__rev2, 33); 6230 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6231 return __ret; 6232 } 6233 #endif 6234 6235 #ifdef __LITTLE_ENDIAN__ 6236 __ai __attribute__((target("neon"))) uint8x8_t vbsl_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 6237 uint8x8_t __ret; 6238 __ret = (uint8x8_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 16); 6239 return __ret; 6240 } 6241 #else 6242 __ai __attribute__((target("neon"))) uint8x8_t vbsl_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 6243 uint8x8_t __ret; 6244 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6245 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6246 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 6247 __ret = (uint8x8_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 16); 6248 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6249 return __ret; 6250 } 6251 #endif 6252 6253 #ifdef __LITTLE_ENDIAN__ 6254 __ai __attribute__((target("neon"))) uint32x2_t vbsl_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 6255 uint32x2_t __ret; 6256 __ret = (uint32x2_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 18); 6257 return __ret; 6258 } 6259 #else 6260 __ai __attribute__((target("neon"))) uint32x2_t vbsl_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 6261 uint32x2_t __ret; 6262 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6263 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6264 uint32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 6265 __ret = (uint32x2_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 18); 6266 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6267 return __ret; 6268 } 6269 #endif 6270 6271 __ai __attribute__((target("neon"))) 
uint64x1_t vbsl_u64(uint64x1_t __p0, uint64x1_t __p1, uint64x1_t __p2) { 6272 uint64x1_t __ret; 6273 __ret = (uint64x1_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 19); 6274 return __ret; 6275 } 6276 #ifdef __LITTLE_ENDIAN__ 6277 __ai __attribute__((target("neon"))) uint16x4_t vbsl_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 6278 uint16x4_t __ret; 6279 __ret = (uint16x4_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 17); 6280 return __ret; 6281 } 6282 #else 6283 __ai __attribute__((target("neon"))) uint16x4_t vbsl_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 6284 uint16x4_t __ret; 6285 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6286 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6287 uint16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 6288 __ret = (uint16x4_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 17); 6289 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6290 return __ret; 6291 } 6292 #endif 6293 6294 #ifdef __LITTLE_ENDIAN__ 6295 __ai __attribute__((target("neon"))) int8x8_t vbsl_s8(uint8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 6296 int8x8_t __ret; 6297 __ret = (int8x8_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 0); 6298 return __ret; 6299 } 6300 #else 6301 __ai __attribute__((target("neon"))) int8x8_t vbsl_s8(uint8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 6302 int8x8_t __ret; 6303 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6304 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6305 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 6306 __ret = (int8x8_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 0); 6307 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 
1, 0); 6308 return __ret; 6309 } 6310 #endif 6311 6312 #ifdef __LITTLE_ENDIAN__ 6313 __ai __attribute__((target("neon"))) float32x2_t vbsl_f32(uint32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 6314 float32x2_t __ret; 6315 __ret = (float32x2_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 6316 return __ret; 6317 } 6318 #else 6319 __ai __attribute__((target("neon"))) float32x2_t vbsl_f32(uint32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 6320 float32x2_t __ret; 6321 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6322 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6323 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 6324 __ret = (float32x2_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 6325 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6326 return __ret; 6327 } 6328 #endif 6329 6330 #ifdef __LITTLE_ENDIAN__ 6331 __ai __attribute__((target("neon"))) int32x2_t vbsl_s32(uint32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 6332 int32x2_t __ret; 6333 __ret = (int32x2_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2); 6334 return __ret; 6335 } 6336 #else 6337 __ai __attribute__((target("neon"))) int32x2_t vbsl_s32(uint32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 6338 int32x2_t __ret; 6339 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6340 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6341 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 6342 __ret = (int32x2_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2); 6343 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6344 return __ret; 6345 } 6346 #endif 6347 6348 __ai __attribute__((target("neon"))) int64x1_t vbsl_s64(uint64x1_t __p0, int64x1_t __p1, int64x1_t __p2) { 6349 int64x1_t __ret; 6350 __ret = (int64x1_t) 
__builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 3); 6351 return __ret; 6352 } 6353 #ifdef __LITTLE_ENDIAN__ 6354 __ai __attribute__((target("neon"))) int16x4_t vbsl_s16(uint16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 6355 int16x4_t __ret; 6356 __ret = (int16x4_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1); 6357 return __ret; 6358 } 6359 #else 6360 __ai __attribute__((target("neon"))) int16x4_t vbsl_s16(uint16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 6361 int16x4_t __ret; 6362 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6363 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6364 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 6365 __ret = (int16x4_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 1); 6366 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6367 return __ret; 6368 } 6369 #endif 6370 6371 #ifdef __LITTLE_ENDIAN__ 6372 __ai __attribute__((target("neon"))) float16x8_t vbslq_f16(uint16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 6373 float16x8_t __ret; 6374 __ret = (float16x8_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 6375 return __ret; 6376 } 6377 #else 6378 __ai __attribute__((target("neon"))) float16x8_t vbslq_f16(uint16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 6379 float16x8_t __ret; 6380 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6381 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6382 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 6383 __ret = (float16x8_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40); 6384 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6385 return __ret; 6386 } 6387 #endif 6388 6389 #ifdef __LITTLE_ENDIAN__ 6390 
__ai __attribute__((target("neon"))) float16x4_t vbsl_f16(uint16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 6391 float16x4_t __ret; 6392 __ret = (float16x4_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 6393 return __ret; 6394 } 6395 #else 6396 __ai __attribute__((target("neon"))) float16x4_t vbsl_f16(uint16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 6397 float16x4_t __ret; 6398 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6399 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6400 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 6401 __ret = (float16x4_t) __builtin_neon_vbsl_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8); 6402 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6403 return __ret; 6404 } 6405 #endif 6406 6407 #ifdef __LITTLE_ENDIAN__ 6408 __ai __attribute__((target("neon"))) uint32x4_t vcageq_f32(float32x4_t __p0, float32x4_t __p1) { 6409 uint32x4_t __ret; 6410 __ret = (uint32x4_t) __builtin_neon_vcageq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 6411 return __ret; 6412 } 6413 #else 6414 __ai __attribute__((target("neon"))) uint32x4_t vcageq_f32(float32x4_t __p0, float32x4_t __p1) { 6415 uint32x4_t __ret; 6416 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6417 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6418 __ret = (uint32x4_t) __builtin_neon_vcageq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 6419 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6420 return __ret; 6421 } 6422 #endif 6423 6424 #ifdef __LITTLE_ENDIAN__ 6425 __ai __attribute__((target("neon"))) uint32x2_t vcage_f32(float32x2_t __p0, float32x2_t __p1) { 6426 uint32x2_t __ret; 6427 __ret = (uint32x2_t) __builtin_neon_vcage_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 6428 return __ret; 6429 } 6430 #else 6431 __ai __attribute__((target("neon"))) uint32x2_t 
vcage_f32(float32x2_t __p0, float32x2_t __p1) { 6432 uint32x2_t __ret; 6433 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6434 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6435 __ret = (uint32x2_t) __builtin_neon_vcage_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 6436 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6437 return __ret; 6438 } 6439 #endif 6440 6441 #ifdef __LITTLE_ENDIAN__ 6442 __ai __attribute__((target("neon"))) uint32x4_t vcagtq_f32(float32x4_t __p0, float32x4_t __p1) { 6443 uint32x4_t __ret; 6444 __ret = (uint32x4_t) __builtin_neon_vcagtq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 6445 return __ret; 6446 } 6447 #else 6448 __ai __attribute__((target("neon"))) uint32x4_t vcagtq_f32(float32x4_t __p0, float32x4_t __p1) { 6449 uint32x4_t __ret; 6450 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6451 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6452 __ret = (uint32x4_t) __builtin_neon_vcagtq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 6453 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6454 return __ret; 6455 } 6456 #endif 6457 6458 #ifdef __LITTLE_ENDIAN__ 6459 __ai __attribute__((target("neon"))) uint32x2_t vcagt_f32(float32x2_t __p0, float32x2_t __p1) { 6460 uint32x2_t __ret; 6461 __ret = (uint32x2_t) __builtin_neon_vcagt_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 6462 return __ret; 6463 } 6464 #else 6465 __ai __attribute__((target("neon"))) uint32x2_t vcagt_f32(float32x2_t __p0, float32x2_t __p1) { 6466 uint32x2_t __ret; 6467 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6468 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6469 __ret = (uint32x2_t) __builtin_neon_vcagt_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 6470 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6471 return __ret; 6472 } 6473 #endif 6474 6475 #ifdef __LITTLE_ENDIAN__ 6476 __ai 
__attribute__((target("neon"))) uint32x4_t vcaleq_f32(float32x4_t __p0, float32x4_t __p1) { 6477 uint32x4_t __ret; 6478 __ret = (uint32x4_t) __builtin_neon_vcaleq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 6479 return __ret; 6480 } 6481 #else 6482 __ai __attribute__((target("neon"))) uint32x4_t vcaleq_f32(float32x4_t __p0, float32x4_t __p1) { 6483 uint32x4_t __ret; 6484 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6485 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6486 __ret = (uint32x4_t) __builtin_neon_vcaleq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 6487 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6488 return __ret; 6489 } 6490 #endif 6491 6492 #ifdef __LITTLE_ENDIAN__ 6493 __ai __attribute__((target("neon"))) uint32x2_t vcale_f32(float32x2_t __p0, float32x2_t __p1) { 6494 uint32x2_t __ret; 6495 __ret = (uint32x2_t) __builtin_neon_vcale_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 6496 return __ret; 6497 } 6498 #else 6499 __ai __attribute__((target("neon"))) uint32x2_t vcale_f32(float32x2_t __p0, float32x2_t __p1) { 6500 uint32x2_t __ret; 6501 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6502 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6503 __ret = (uint32x2_t) __builtin_neon_vcale_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 6504 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6505 return __ret; 6506 } 6507 #endif 6508 6509 #ifdef __LITTLE_ENDIAN__ 6510 __ai __attribute__((target("neon"))) uint32x4_t vcaltq_f32(float32x4_t __p0, float32x4_t __p1) { 6511 uint32x4_t __ret; 6512 __ret = (uint32x4_t) __builtin_neon_vcaltq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 6513 return __ret; 6514 } 6515 #else 6516 __ai __attribute__((target("neon"))) uint32x4_t vcaltq_f32(float32x4_t __p0, float32x4_t __p1) { 6517 uint32x4_t __ret; 6518 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6519 float32x4_t __rev1; __rev1 
= __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6520 __ret = (uint32x4_t) __builtin_neon_vcaltq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 6521 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6522 return __ret; 6523 } 6524 #endif 6525 6526 #ifdef __LITTLE_ENDIAN__ 6527 __ai __attribute__((target("neon"))) uint32x2_t vcalt_f32(float32x2_t __p0, float32x2_t __p1) { 6528 uint32x2_t __ret; 6529 __ret = (uint32x2_t) __builtin_neon_vcalt_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 6530 return __ret; 6531 } 6532 #else 6533 __ai __attribute__((target("neon"))) uint32x2_t vcalt_f32(float32x2_t __p0, float32x2_t __p1) { 6534 uint32x2_t __ret; 6535 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6536 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6537 __ret = (uint32x2_t) __builtin_neon_vcalt_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 6538 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6539 return __ret; 6540 } 6541 #endif 6542 6543 #ifdef __LITTLE_ENDIAN__ 6544 __ai __attribute__((target("neon"))) uint8x8_t vceq_p8(poly8x8_t __p0, poly8x8_t __p1) { 6545 uint8x8_t __ret; 6546 __ret = (uint8x8_t)(__p0 == __p1); 6547 return __ret; 6548 } 6549 #else 6550 __ai __attribute__((target("neon"))) uint8x8_t vceq_p8(poly8x8_t __p0, poly8x8_t __p1) { 6551 uint8x8_t __ret; 6552 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6553 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6554 __ret = (uint8x8_t)(__rev0 == __rev1); 6555 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6556 return __ret; 6557 } 6558 #endif 6559 6560 #ifdef __LITTLE_ENDIAN__ 6561 __ai __attribute__((target("neon"))) uint8x16_t vceqq_p8(poly8x16_t __p0, poly8x16_t __p1) { 6562 uint8x16_t __ret; 6563 __ret = (uint8x16_t)(__p0 == __p1); 6564 return __ret; 6565 } 6566 #else 6567 __ai __attribute__((target("neon"))) uint8x16_t vceqq_p8(poly8x16_t __p0, 
poly8x16_t __p1) { 6568 uint8x16_t __ret; 6569 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6570 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6571 __ret = (uint8x16_t)(__rev0 == __rev1); 6572 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6573 return __ret; 6574 } 6575 #endif 6576 6577 #ifdef __LITTLE_ENDIAN__ 6578 __ai __attribute__((target("neon"))) uint8x16_t vceqq_u8(uint8x16_t __p0, uint8x16_t __p1) { 6579 uint8x16_t __ret; 6580 __ret = (uint8x16_t)(__p0 == __p1); 6581 return __ret; 6582 } 6583 #else 6584 __ai __attribute__((target("neon"))) uint8x16_t vceqq_u8(uint8x16_t __p0, uint8x16_t __p1) { 6585 uint8x16_t __ret; 6586 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6587 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6588 __ret = (uint8x16_t)(__rev0 == __rev1); 6589 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6590 return __ret; 6591 } 6592 #endif 6593 6594 #ifdef __LITTLE_ENDIAN__ 6595 __ai __attribute__((target("neon"))) uint32x4_t vceqq_u32(uint32x4_t __p0, uint32x4_t __p1) { 6596 uint32x4_t __ret; 6597 __ret = (uint32x4_t)(__p0 == __p1); 6598 return __ret; 6599 } 6600 #else 6601 __ai __attribute__((target("neon"))) uint32x4_t vceqq_u32(uint32x4_t __p0, uint32x4_t __p1) { 6602 uint32x4_t __ret; 6603 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6604 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6605 __ret = (uint32x4_t)(__rev0 == __rev1); 6606 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6607 return __ret; 6608 } 6609 #endif 6610 6611 #ifdef __LITTLE_ENDIAN__ 6612 __ai 
__attribute__((target("neon"))) uint16x8_t vceqq_u16(uint16x8_t __p0, uint16x8_t __p1) { 6613 uint16x8_t __ret; 6614 __ret = (uint16x8_t)(__p0 == __p1); 6615 return __ret; 6616 } 6617 #else 6618 __ai __attribute__((target("neon"))) uint16x8_t vceqq_u16(uint16x8_t __p0, uint16x8_t __p1) { 6619 uint16x8_t __ret; 6620 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6621 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6622 __ret = (uint16x8_t)(__rev0 == __rev1); 6623 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6624 return __ret; 6625 } 6626 #endif 6627 6628 #ifdef __LITTLE_ENDIAN__ 6629 __ai __attribute__((target("neon"))) uint8x16_t vceqq_s8(int8x16_t __p0, int8x16_t __p1) { 6630 uint8x16_t __ret; 6631 __ret = (uint8x16_t)(__p0 == __p1); 6632 return __ret; 6633 } 6634 #else 6635 __ai __attribute__((target("neon"))) uint8x16_t vceqq_s8(int8x16_t __p0, int8x16_t __p1) { 6636 uint8x16_t __ret; 6637 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6638 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6639 __ret = (uint8x16_t)(__rev0 == __rev1); 6640 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6641 return __ret; 6642 } 6643 #endif 6644 6645 #ifdef __LITTLE_ENDIAN__ 6646 __ai __attribute__((target("neon"))) uint32x4_t vceqq_f32(float32x4_t __p0, float32x4_t __p1) { 6647 uint32x4_t __ret; 6648 __ret = (uint32x4_t)(__p0 == __p1); 6649 return __ret; 6650 } 6651 #else 6652 __ai __attribute__((target("neon"))) uint32x4_t vceqq_f32(float32x4_t __p0, float32x4_t __p1) { 6653 uint32x4_t __ret; 6654 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6655 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6656 __ret = 
(uint32x4_t)(__rev0 == __rev1); 6657 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6658 return __ret; 6659 } 6660 #endif 6661 6662 #ifdef __LITTLE_ENDIAN__ 6663 __ai __attribute__((target("neon"))) uint32x4_t vceqq_s32(int32x4_t __p0, int32x4_t __p1) { 6664 uint32x4_t __ret; 6665 __ret = (uint32x4_t)(__p0 == __p1); 6666 return __ret; 6667 } 6668 #else 6669 __ai __attribute__((target("neon"))) uint32x4_t vceqq_s32(int32x4_t __p0, int32x4_t __p1) { 6670 uint32x4_t __ret; 6671 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6672 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6673 __ret = (uint32x4_t)(__rev0 == __rev1); 6674 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6675 return __ret; 6676 } 6677 #endif 6678 6679 #ifdef __LITTLE_ENDIAN__ 6680 __ai __attribute__((target("neon"))) uint16x8_t vceqq_s16(int16x8_t __p0, int16x8_t __p1) { 6681 uint16x8_t __ret; 6682 __ret = (uint16x8_t)(__p0 == __p1); 6683 return __ret; 6684 } 6685 #else 6686 __ai __attribute__((target("neon"))) uint16x8_t vceqq_s16(int16x8_t __p0, int16x8_t __p1) { 6687 uint16x8_t __ret; 6688 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6689 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6690 __ret = (uint16x8_t)(__rev0 == __rev1); 6691 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6692 return __ret; 6693 } 6694 #endif 6695 6696 #ifdef __LITTLE_ENDIAN__ 6697 __ai __attribute__((target("neon"))) uint8x8_t vceq_u8(uint8x8_t __p0, uint8x8_t __p1) { 6698 uint8x8_t __ret; 6699 __ret = (uint8x8_t)(__p0 == __p1); 6700 return __ret; 6701 } 6702 #else 6703 __ai __attribute__((target("neon"))) uint8x8_t vceq_u8(uint8x8_t __p0, uint8x8_t __p1) { 6704 uint8x8_t __ret; 6705 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6706 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 
7, 6, 5, 4, 3, 2, 1, 0); 6707 __ret = (uint8x8_t)(__rev0 == __rev1); 6708 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6709 return __ret; 6710 } 6711 #endif 6712 6713 #ifdef __LITTLE_ENDIAN__ 6714 __ai __attribute__((target("neon"))) uint32x2_t vceq_u32(uint32x2_t __p0, uint32x2_t __p1) { 6715 uint32x2_t __ret; 6716 __ret = (uint32x2_t)(__p0 == __p1); 6717 return __ret; 6718 } 6719 #else 6720 __ai __attribute__((target("neon"))) uint32x2_t vceq_u32(uint32x2_t __p0, uint32x2_t __p1) { 6721 uint32x2_t __ret; 6722 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6723 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6724 __ret = (uint32x2_t)(__rev0 == __rev1); 6725 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6726 return __ret; 6727 } 6728 #endif 6729 6730 #ifdef __LITTLE_ENDIAN__ 6731 __ai __attribute__((target("neon"))) uint16x4_t vceq_u16(uint16x4_t __p0, uint16x4_t __p1) { 6732 uint16x4_t __ret; 6733 __ret = (uint16x4_t)(__p0 == __p1); 6734 return __ret; 6735 } 6736 #else 6737 __ai __attribute__((target("neon"))) uint16x4_t vceq_u16(uint16x4_t __p0, uint16x4_t __p1) { 6738 uint16x4_t __ret; 6739 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6740 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6741 __ret = (uint16x4_t)(__rev0 == __rev1); 6742 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6743 return __ret; 6744 } 6745 #endif 6746 6747 #ifdef __LITTLE_ENDIAN__ 6748 __ai __attribute__((target("neon"))) uint8x8_t vceq_s8(int8x8_t __p0, int8x8_t __p1) { 6749 uint8x8_t __ret; 6750 __ret = (uint8x8_t)(__p0 == __p1); 6751 return __ret; 6752 } 6753 #else 6754 __ai __attribute__((target("neon"))) uint8x8_t vceq_s8(int8x8_t __p0, int8x8_t __p1) { 6755 uint8x8_t __ret; 6756 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6757 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 
6, 5, 4, 3, 2, 1, 0); 6758 __ret = (uint8x8_t)(__rev0 == __rev1); 6759 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6760 return __ret; 6761 } 6762 #endif 6763 6764 #ifdef __LITTLE_ENDIAN__ 6765 __ai __attribute__((target("neon"))) uint32x2_t vceq_f32(float32x2_t __p0, float32x2_t __p1) { 6766 uint32x2_t __ret; 6767 __ret = (uint32x2_t)(__p0 == __p1); 6768 return __ret; 6769 } 6770 #else 6771 __ai __attribute__((target("neon"))) uint32x2_t vceq_f32(float32x2_t __p0, float32x2_t __p1) { 6772 uint32x2_t __ret; 6773 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6774 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6775 __ret = (uint32x2_t)(__rev0 == __rev1); 6776 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6777 return __ret; 6778 } 6779 #endif 6780 6781 #ifdef __LITTLE_ENDIAN__ 6782 __ai __attribute__((target("neon"))) uint32x2_t vceq_s32(int32x2_t __p0, int32x2_t __p1) { 6783 uint32x2_t __ret; 6784 __ret = (uint32x2_t)(__p0 == __p1); 6785 return __ret; 6786 } 6787 #else 6788 __ai __attribute__((target("neon"))) uint32x2_t vceq_s32(int32x2_t __p0, int32x2_t __p1) { 6789 uint32x2_t __ret; 6790 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6791 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6792 __ret = (uint32x2_t)(__rev0 == __rev1); 6793 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6794 return __ret; 6795 } 6796 #endif 6797 6798 #ifdef __LITTLE_ENDIAN__ 6799 __ai __attribute__((target("neon"))) uint16x4_t vceq_s16(int16x4_t __p0, int16x4_t __p1) { 6800 uint16x4_t __ret; 6801 __ret = (uint16x4_t)(__p0 == __p1); 6802 return __ret; 6803 } 6804 #else 6805 __ai __attribute__((target("neon"))) uint16x4_t vceq_s16(int16x4_t __p0, int16x4_t __p1) { 6806 uint16x4_t __ret; 6807 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6808 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6809 __ret 
= (uint16x4_t)(__rev0 == __rev1); 6810 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6811 return __ret; 6812 } 6813 #endif 6814 6815 #ifdef __LITTLE_ENDIAN__ 6816 __ai __attribute__((target("neon"))) uint8x16_t vcgeq_u8(uint8x16_t __p0, uint8x16_t __p1) { 6817 uint8x16_t __ret; 6818 __ret = (uint8x16_t)(__p0 >= __p1); 6819 return __ret; 6820 } 6821 #else 6822 __ai __attribute__((target("neon"))) uint8x16_t vcgeq_u8(uint8x16_t __p0, uint8x16_t __p1) { 6823 uint8x16_t __ret; 6824 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6825 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6826 __ret = (uint8x16_t)(__rev0 >= __rev1); 6827 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6828 return __ret; 6829 } 6830 #endif 6831 6832 #ifdef __LITTLE_ENDIAN__ 6833 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_u32(uint32x4_t __p0, uint32x4_t __p1) { 6834 uint32x4_t __ret; 6835 __ret = (uint32x4_t)(__p0 >= __p1); 6836 return __ret; 6837 } 6838 #else 6839 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_u32(uint32x4_t __p0, uint32x4_t __p1) { 6840 uint32x4_t __ret; 6841 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6842 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6843 __ret = (uint32x4_t)(__rev0 >= __rev1); 6844 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6845 return __ret; 6846 } 6847 #endif 6848 6849 #ifdef __LITTLE_ENDIAN__ 6850 __ai __attribute__((target("neon"))) uint16x8_t vcgeq_u16(uint16x8_t __p0, uint16x8_t __p1) { 6851 uint16x8_t __ret; 6852 __ret = (uint16x8_t)(__p0 >= __p1); 6853 return __ret; 6854 } 6855 #else 6856 __ai __attribute__((target("neon"))) uint16x8_t vcgeq_u16(uint16x8_t __p0, uint16x8_t __p1) { 6857 uint16x8_t __ret; 6858 uint16x8_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6859 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6860 __ret = (uint16x8_t)(__rev0 >= __rev1); 6861 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6862 return __ret; 6863 } 6864 #endif 6865 6866 #ifdef __LITTLE_ENDIAN__ 6867 __ai __attribute__((target("neon"))) uint8x16_t vcgeq_s8(int8x16_t __p0, int8x16_t __p1) { 6868 uint8x16_t __ret; 6869 __ret = (uint8x16_t)(__p0 >= __p1); 6870 return __ret; 6871 } 6872 #else 6873 __ai __attribute__((target("neon"))) uint8x16_t vcgeq_s8(int8x16_t __p0, int8x16_t __p1) { 6874 uint8x16_t __ret; 6875 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6876 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6877 __ret = (uint8x16_t)(__rev0 >= __rev1); 6878 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 6879 return __ret; 6880 } 6881 #endif 6882 6883 #ifdef __LITTLE_ENDIAN__ 6884 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_f32(float32x4_t __p0, float32x4_t __p1) { 6885 uint32x4_t __ret; 6886 __ret = (uint32x4_t)(__p0 >= __p1); 6887 return __ret; 6888 } 6889 #else 6890 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_f32(float32x4_t __p0, float32x4_t __p1) { 6891 uint32x4_t __ret; 6892 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6893 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6894 __ret = (uint32x4_t)(__rev0 >= __rev1); 6895 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6896 return __ret; 6897 } 6898 #endif 6899 6900 #ifdef __LITTLE_ENDIAN__ 6901 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_s32(int32x4_t __p0, int32x4_t __p1) { 6902 uint32x4_t __ret; 6903 __ret = (uint32x4_t)(__p0 >= __p1); 6904 return __ret; 6905 } 
6906 #else 6907 __ai __attribute__((target("neon"))) uint32x4_t vcgeq_s32(int32x4_t __p0, int32x4_t __p1) { 6908 uint32x4_t __ret; 6909 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6910 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6911 __ret = (uint32x4_t)(__rev0 >= __rev1); 6912 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6913 return __ret; 6914 } 6915 #endif 6916 6917 #ifdef __LITTLE_ENDIAN__ 6918 __ai __attribute__((target("neon"))) uint16x8_t vcgeq_s16(int16x8_t __p0, int16x8_t __p1) { 6919 uint16x8_t __ret; 6920 __ret = (uint16x8_t)(__p0 >= __p1); 6921 return __ret; 6922 } 6923 #else 6924 __ai __attribute__((target("neon"))) uint16x8_t vcgeq_s16(int16x8_t __p0, int16x8_t __p1) { 6925 uint16x8_t __ret; 6926 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6927 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6928 __ret = (uint16x8_t)(__rev0 >= __rev1); 6929 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6930 return __ret; 6931 } 6932 #endif 6933 6934 #ifdef __LITTLE_ENDIAN__ 6935 __ai __attribute__((target("neon"))) uint8x8_t vcge_u8(uint8x8_t __p0, uint8x8_t __p1) { 6936 uint8x8_t __ret; 6937 __ret = (uint8x8_t)(__p0 >= __p1); 6938 return __ret; 6939 } 6940 #else 6941 __ai __attribute__((target("neon"))) uint8x8_t vcge_u8(uint8x8_t __p0, uint8x8_t __p1) { 6942 uint8x8_t __ret; 6943 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6944 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6945 __ret = (uint8x8_t)(__rev0 >= __rev1); 6946 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6947 return __ret; 6948 } 6949 #endif 6950 6951 #ifdef __LITTLE_ENDIAN__ 6952 __ai __attribute__((target("neon"))) uint32x2_t vcge_u32(uint32x2_t __p0, uint32x2_t __p1) { 6953 uint32x2_t __ret; 6954 __ret = 
(uint32x2_t)(__p0 >= __p1); 6955 return __ret; 6956 } 6957 #else 6958 __ai __attribute__((target("neon"))) uint32x2_t vcge_u32(uint32x2_t __p0, uint32x2_t __p1) { 6959 uint32x2_t __ret; 6960 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 6961 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 6962 __ret = (uint32x2_t)(__rev0 >= __rev1); 6963 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 6964 return __ret; 6965 } 6966 #endif 6967 6968 #ifdef __LITTLE_ENDIAN__ 6969 __ai __attribute__((target("neon"))) uint16x4_t vcge_u16(uint16x4_t __p0, uint16x4_t __p1) { 6970 uint16x4_t __ret; 6971 __ret = (uint16x4_t)(__p0 >= __p1); 6972 return __ret; 6973 } 6974 #else 6975 __ai __attribute__((target("neon"))) uint16x4_t vcge_u16(uint16x4_t __p0, uint16x4_t __p1) { 6976 uint16x4_t __ret; 6977 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 6978 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 6979 __ret = (uint16x4_t)(__rev0 >= __rev1); 6980 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 6981 return __ret; 6982 } 6983 #endif 6984 6985 #ifdef __LITTLE_ENDIAN__ 6986 __ai __attribute__((target("neon"))) uint8x8_t vcge_s8(int8x8_t __p0, int8x8_t __p1) { 6987 uint8x8_t __ret; 6988 __ret = (uint8x8_t)(__p0 >= __p1); 6989 return __ret; 6990 } 6991 #else 6992 __ai __attribute__((target("neon"))) uint8x8_t vcge_s8(int8x8_t __p0, int8x8_t __p1) { 6993 uint8x8_t __ret; 6994 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 6995 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 6996 __ret = (uint8x8_t)(__rev0 >= __rev1); 6997 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 6998 return __ret; 6999 } 7000 #endif 7001 7002 #ifdef __LITTLE_ENDIAN__ 7003 __ai __attribute__((target("neon"))) uint32x2_t vcge_f32(float32x2_t __p0, float32x2_t __p1) { 7004 uint32x2_t __ret; 7005 __ret = 
(uint32x2_t)(__p0 >= __p1); 7006 return __ret; 7007 } 7008 #else 7009 __ai __attribute__((target("neon"))) uint32x2_t vcge_f32(float32x2_t __p0, float32x2_t __p1) { 7010 uint32x2_t __ret; 7011 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7012 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7013 __ret = (uint32x2_t)(__rev0 >= __rev1); 7014 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7015 return __ret; 7016 } 7017 #endif 7018 7019 #ifdef __LITTLE_ENDIAN__ 7020 __ai __attribute__((target("neon"))) uint32x2_t vcge_s32(int32x2_t __p0, int32x2_t __p1) { 7021 uint32x2_t __ret; 7022 __ret = (uint32x2_t)(__p0 >= __p1); 7023 return __ret; 7024 } 7025 #else 7026 __ai __attribute__((target("neon"))) uint32x2_t vcge_s32(int32x2_t __p0, int32x2_t __p1) { 7027 uint32x2_t __ret; 7028 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7029 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7030 __ret = (uint32x2_t)(__rev0 >= __rev1); 7031 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7032 return __ret; 7033 } 7034 #endif 7035 7036 #ifdef __LITTLE_ENDIAN__ 7037 __ai __attribute__((target("neon"))) uint16x4_t vcge_s16(int16x4_t __p0, int16x4_t __p1) { 7038 uint16x4_t __ret; 7039 __ret = (uint16x4_t)(__p0 >= __p1); 7040 return __ret; 7041 } 7042 #else 7043 __ai __attribute__((target("neon"))) uint16x4_t vcge_s16(int16x4_t __p0, int16x4_t __p1) { 7044 uint16x4_t __ret; 7045 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7046 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7047 __ret = (uint16x4_t)(__rev0 >= __rev1); 7048 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7049 return __ret; 7050 } 7051 #endif 7052 7053 #ifdef __LITTLE_ENDIAN__ 7054 __ai __attribute__((target("neon"))) uint8x16_t vcgtq_u8(uint8x16_t __p0, uint8x16_t __p1) { 7055 uint8x16_t __ret; 7056 __ret = (uint8x16_t)(__p0 > __p1); 7057 return __ret; 
7058 } 7059 #else 7060 __ai __attribute__((target("neon"))) uint8x16_t vcgtq_u8(uint8x16_t __p0, uint8x16_t __p1) { 7061 uint8x16_t __ret; 7062 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7063 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7064 __ret = (uint8x16_t)(__rev0 > __rev1); 7065 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7066 return __ret; 7067 } 7068 #endif 7069 7070 #ifdef __LITTLE_ENDIAN__ 7071 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_u32(uint32x4_t __p0, uint32x4_t __p1) { 7072 uint32x4_t __ret; 7073 __ret = (uint32x4_t)(__p0 > __p1); 7074 return __ret; 7075 } 7076 #else 7077 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_u32(uint32x4_t __p0, uint32x4_t __p1) { 7078 uint32x4_t __ret; 7079 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7080 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7081 __ret = (uint32x4_t)(__rev0 > __rev1); 7082 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7083 return __ret; 7084 } 7085 #endif 7086 7087 #ifdef __LITTLE_ENDIAN__ 7088 __ai __attribute__((target("neon"))) uint16x8_t vcgtq_u16(uint16x8_t __p0, uint16x8_t __p1) { 7089 uint16x8_t __ret; 7090 __ret = (uint16x8_t)(__p0 > __p1); 7091 return __ret; 7092 } 7093 #else 7094 __ai __attribute__((target("neon"))) uint16x8_t vcgtq_u16(uint16x8_t __p0, uint16x8_t __p1) { 7095 uint16x8_t __ret; 7096 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7097 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7098 __ret = (uint16x8_t)(__rev0 > __rev1); 7099 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7100 return __ret; 7101 } 7102 #endif 7103 7104 #ifdef __LITTLE_ENDIAN__ 7105 __ai 
__attribute__((target("neon"))) uint8x16_t vcgtq_s8(int8x16_t __p0, int8x16_t __p1) { 7106 uint8x16_t __ret; 7107 __ret = (uint8x16_t)(__p0 > __p1); 7108 return __ret; 7109 } 7110 #else 7111 __ai __attribute__((target("neon"))) uint8x16_t vcgtq_s8(int8x16_t __p0, int8x16_t __p1) { 7112 uint8x16_t __ret; 7113 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7114 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7115 __ret = (uint8x16_t)(__rev0 > __rev1); 7116 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7117 return __ret; 7118 } 7119 #endif 7120 7121 #ifdef __LITTLE_ENDIAN__ 7122 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_f32(float32x4_t __p0, float32x4_t __p1) { 7123 uint32x4_t __ret; 7124 __ret = (uint32x4_t)(__p0 > __p1); 7125 return __ret; 7126 } 7127 #else 7128 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_f32(float32x4_t __p0, float32x4_t __p1) { 7129 uint32x4_t __ret; 7130 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7131 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7132 __ret = (uint32x4_t)(__rev0 > __rev1); 7133 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7134 return __ret; 7135 } 7136 #endif 7137 7138 #ifdef __LITTLE_ENDIAN__ 7139 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_s32(int32x4_t __p0, int32x4_t __p1) { 7140 uint32x4_t __ret; 7141 __ret = (uint32x4_t)(__p0 > __p1); 7142 return __ret; 7143 } 7144 #else 7145 __ai __attribute__((target("neon"))) uint32x4_t vcgtq_s32(int32x4_t __p0, int32x4_t __p1) { 7146 uint32x4_t __ret; 7147 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7148 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7149 __ret = (uint32x4_t)(__rev0 > __rev1); 7150 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7151 return __ret; 7152 } 7153 #endif 7154 7155 #ifdef __LITTLE_ENDIAN__ 7156 __ai __attribute__((target("neon"))) uint16x8_t vcgtq_s16(int16x8_t __p0, int16x8_t __p1) { 7157 uint16x8_t __ret; 7158 __ret = (uint16x8_t)(__p0 > __p1); 7159 return __ret; 7160 } 7161 #else 7162 __ai __attribute__((target("neon"))) uint16x8_t vcgtq_s16(int16x8_t __p0, int16x8_t __p1) { 7163 uint16x8_t __ret; 7164 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7165 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7166 __ret = (uint16x8_t)(__rev0 > __rev1); 7167 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7168 return __ret; 7169 } 7170 #endif 7171 7172 #ifdef __LITTLE_ENDIAN__ 7173 __ai __attribute__((target("neon"))) uint8x8_t vcgt_u8(uint8x8_t __p0, uint8x8_t __p1) { 7174 uint8x8_t __ret; 7175 __ret = (uint8x8_t)(__p0 > __p1); 7176 return __ret; 7177 } 7178 #else 7179 __ai __attribute__((target("neon"))) uint8x8_t vcgt_u8(uint8x8_t __p0, uint8x8_t __p1) { 7180 uint8x8_t __ret; 7181 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7182 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7183 __ret = (uint8x8_t)(__rev0 > __rev1); 7184 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7185 return __ret; 7186 } 7187 #endif 7188 7189 #ifdef __LITTLE_ENDIAN__ 7190 __ai __attribute__((target("neon"))) uint32x2_t vcgt_u32(uint32x2_t __p0, uint32x2_t __p1) { 7191 uint32x2_t __ret; 7192 __ret = (uint32x2_t)(__p0 > __p1); 7193 return __ret; 7194 } 7195 #else 7196 __ai __attribute__((target("neon"))) uint32x2_t vcgt_u32(uint32x2_t __p0, uint32x2_t __p1) { 7197 uint32x2_t __ret; 7198 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7199 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7200 __ret = 
(uint32x2_t)(__rev0 > __rev1); 7201 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7202 return __ret; 7203 } 7204 #endif 7205 7206 #ifdef __LITTLE_ENDIAN__ 7207 __ai __attribute__((target("neon"))) uint16x4_t vcgt_u16(uint16x4_t __p0, uint16x4_t __p1) { 7208 uint16x4_t __ret; 7209 __ret = (uint16x4_t)(__p0 > __p1); 7210 return __ret; 7211 } 7212 #else 7213 __ai __attribute__((target("neon"))) uint16x4_t vcgt_u16(uint16x4_t __p0, uint16x4_t __p1) { 7214 uint16x4_t __ret; 7215 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7216 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7217 __ret = (uint16x4_t)(__rev0 > __rev1); 7218 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7219 return __ret; 7220 } 7221 #endif 7222 7223 #ifdef __LITTLE_ENDIAN__ 7224 __ai __attribute__((target("neon"))) uint8x8_t vcgt_s8(int8x8_t __p0, int8x8_t __p1) { 7225 uint8x8_t __ret; 7226 __ret = (uint8x8_t)(__p0 > __p1); 7227 return __ret; 7228 } 7229 #else 7230 __ai __attribute__((target("neon"))) uint8x8_t vcgt_s8(int8x8_t __p0, int8x8_t __p1) { 7231 uint8x8_t __ret; 7232 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7233 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7234 __ret = (uint8x8_t)(__rev0 > __rev1); 7235 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7236 return __ret; 7237 } 7238 #endif 7239 7240 #ifdef __LITTLE_ENDIAN__ 7241 __ai __attribute__((target("neon"))) uint32x2_t vcgt_f32(float32x2_t __p0, float32x2_t __p1) { 7242 uint32x2_t __ret; 7243 __ret = (uint32x2_t)(__p0 > __p1); 7244 return __ret; 7245 } 7246 #else 7247 __ai __attribute__((target("neon"))) uint32x2_t vcgt_f32(float32x2_t __p0, float32x2_t __p1) { 7248 uint32x2_t __ret; 7249 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7250 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7251 __ret = 
(uint32x2_t)(__rev0 > __rev1); 7252 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7253 return __ret; 7254 } 7255 #endif 7256 7257 #ifdef __LITTLE_ENDIAN__ 7258 __ai __attribute__((target("neon"))) uint32x2_t vcgt_s32(int32x2_t __p0, int32x2_t __p1) { 7259 uint32x2_t __ret; 7260 __ret = (uint32x2_t)(__p0 > __p1); 7261 return __ret; 7262 } 7263 #else 7264 __ai __attribute__((target("neon"))) uint32x2_t vcgt_s32(int32x2_t __p0, int32x2_t __p1) { 7265 uint32x2_t __ret; 7266 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7267 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7268 __ret = (uint32x2_t)(__rev0 > __rev1); 7269 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7270 return __ret; 7271 } 7272 #endif 7273 7274 #ifdef __LITTLE_ENDIAN__ 7275 __ai __attribute__((target("neon"))) uint16x4_t vcgt_s16(int16x4_t __p0, int16x4_t __p1) { 7276 uint16x4_t __ret; 7277 __ret = (uint16x4_t)(__p0 > __p1); 7278 return __ret; 7279 } 7280 #else 7281 __ai __attribute__((target("neon"))) uint16x4_t vcgt_s16(int16x4_t __p0, int16x4_t __p1) { 7282 uint16x4_t __ret; 7283 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7284 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7285 __ret = (uint16x4_t)(__rev0 > __rev1); 7286 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7287 return __ret; 7288 } 7289 #endif 7290 7291 #ifdef __LITTLE_ENDIAN__ 7292 __ai __attribute__((target("neon"))) uint8x16_t vcleq_u8(uint8x16_t __p0, uint8x16_t __p1) { 7293 uint8x16_t __ret; 7294 __ret = (uint8x16_t)(__p0 <= __p1); 7295 return __ret; 7296 } 7297 #else 7298 __ai __attribute__((target("neon"))) uint8x16_t vcleq_u8(uint8x16_t __p0, uint8x16_t __p1) { 7299 uint8x16_t __ret; 7300 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7301 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 
8, 7, 6, 5, 4, 3, 2, 1, 0); 7302 __ret = (uint8x16_t)(__rev0 <= __rev1); 7303 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7304 return __ret; 7305 } 7306 #endif 7307 7308 #ifdef __LITTLE_ENDIAN__ 7309 __ai __attribute__((target("neon"))) uint32x4_t vcleq_u32(uint32x4_t __p0, uint32x4_t __p1) { 7310 uint32x4_t __ret; 7311 __ret = (uint32x4_t)(__p0 <= __p1); 7312 return __ret; 7313 } 7314 #else 7315 __ai __attribute__((target("neon"))) uint32x4_t vcleq_u32(uint32x4_t __p0, uint32x4_t __p1) { 7316 uint32x4_t __ret; 7317 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7318 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7319 __ret = (uint32x4_t)(__rev0 <= __rev1); 7320 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7321 return __ret; 7322 } 7323 #endif 7324 7325 #ifdef __LITTLE_ENDIAN__ 7326 __ai __attribute__((target("neon"))) uint16x8_t vcleq_u16(uint16x8_t __p0, uint16x8_t __p1) { 7327 uint16x8_t __ret; 7328 __ret = (uint16x8_t)(__p0 <= __p1); 7329 return __ret; 7330 } 7331 #else 7332 __ai __attribute__((target("neon"))) uint16x8_t vcleq_u16(uint16x8_t __p0, uint16x8_t __p1) { 7333 uint16x8_t __ret; 7334 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7335 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7336 __ret = (uint16x8_t)(__rev0 <= __rev1); 7337 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7338 return __ret; 7339 } 7340 #endif 7341 7342 #ifdef __LITTLE_ENDIAN__ 7343 __ai __attribute__((target("neon"))) uint8x16_t vcleq_s8(int8x16_t __p0, int8x16_t __p1) { 7344 uint8x16_t __ret; 7345 __ret = (uint8x16_t)(__p0 <= __p1); 7346 return __ret; 7347 } 7348 #else 7349 __ai __attribute__((target("neon"))) uint8x16_t vcleq_s8(int8x16_t __p0, int8x16_t __p1) { 7350 uint8x16_t __ret; 7351 int8x16_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7352 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7353 __ret = (uint8x16_t)(__rev0 <= __rev1); 7354 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7355 return __ret; 7356 } 7357 #endif 7358 7359 #ifdef __LITTLE_ENDIAN__ 7360 __ai __attribute__((target("neon"))) uint32x4_t vcleq_f32(float32x4_t __p0, float32x4_t __p1) { 7361 uint32x4_t __ret; 7362 __ret = (uint32x4_t)(__p0 <= __p1); 7363 return __ret; 7364 } 7365 #else 7366 __ai __attribute__((target("neon"))) uint32x4_t vcleq_f32(float32x4_t __p0, float32x4_t __p1) { 7367 uint32x4_t __ret; 7368 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7369 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7370 __ret = (uint32x4_t)(__rev0 <= __rev1); 7371 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7372 return __ret; 7373 } 7374 #endif 7375 7376 #ifdef __LITTLE_ENDIAN__ 7377 __ai __attribute__((target("neon"))) uint32x4_t vcleq_s32(int32x4_t __p0, int32x4_t __p1) { 7378 uint32x4_t __ret; 7379 __ret = (uint32x4_t)(__p0 <= __p1); 7380 return __ret; 7381 } 7382 #else 7383 __ai __attribute__((target("neon"))) uint32x4_t vcleq_s32(int32x4_t __p0, int32x4_t __p1) { 7384 uint32x4_t __ret; 7385 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7386 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7387 __ret = (uint32x4_t)(__rev0 <= __rev1); 7388 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7389 return __ret; 7390 } 7391 #endif 7392 7393 #ifdef __LITTLE_ENDIAN__ 7394 __ai __attribute__((target("neon"))) uint16x8_t vcleq_s16(int16x8_t __p0, int16x8_t __p1) { 7395 uint16x8_t __ret; 7396 __ret = (uint16x8_t)(__p0 <= __p1); 7397 return __ret; 7398 } 7399 #else 7400 __ai 
__attribute__((target("neon"))) uint16x8_t vcleq_s16(int16x8_t __p0, int16x8_t __p1) { 7401 uint16x8_t __ret; 7402 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7403 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7404 __ret = (uint16x8_t)(__rev0 <= __rev1); 7405 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7406 return __ret; 7407 } 7408 #endif 7409 7410 #ifdef __LITTLE_ENDIAN__ 7411 __ai __attribute__((target("neon"))) uint8x8_t vcle_u8(uint8x8_t __p0, uint8x8_t __p1) { 7412 uint8x8_t __ret; 7413 __ret = (uint8x8_t)(__p0 <= __p1); 7414 return __ret; 7415 } 7416 #else 7417 __ai __attribute__((target("neon"))) uint8x8_t vcle_u8(uint8x8_t __p0, uint8x8_t __p1) { 7418 uint8x8_t __ret; 7419 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7420 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7421 __ret = (uint8x8_t)(__rev0 <= __rev1); 7422 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7423 return __ret; 7424 } 7425 #endif 7426 7427 #ifdef __LITTLE_ENDIAN__ 7428 __ai __attribute__((target("neon"))) uint32x2_t vcle_u32(uint32x2_t __p0, uint32x2_t __p1) { 7429 uint32x2_t __ret; 7430 __ret = (uint32x2_t)(__p0 <= __p1); 7431 return __ret; 7432 } 7433 #else 7434 __ai __attribute__((target("neon"))) uint32x2_t vcle_u32(uint32x2_t __p0, uint32x2_t __p1) { 7435 uint32x2_t __ret; 7436 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7437 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7438 __ret = (uint32x2_t)(__rev0 <= __rev1); 7439 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7440 return __ret; 7441 } 7442 #endif 7443 7444 #ifdef __LITTLE_ENDIAN__ 7445 __ai __attribute__((target("neon"))) uint16x4_t vcle_u16(uint16x4_t __p0, uint16x4_t __p1) { 7446 uint16x4_t __ret; 7447 __ret = (uint16x4_t)(__p0 <= __p1); 7448 return 
__ret; 7449 } 7450 #else 7451 __ai __attribute__((target("neon"))) uint16x4_t vcle_u16(uint16x4_t __p0, uint16x4_t __p1) { 7452 uint16x4_t __ret; 7453 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7454 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7455 __ret = (uint16x4_t)(__rev0 <= __rev1); 7456 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7457 return __ret; 7458 } 7459 #endif 7460 7461 #ifdef __LITTLE_ENDIAN__ 7462 __ai __attribute__((target("neon"))) uint8x8_t vcle_s8(int8x8_t __p0, int8x8_t __p1) { 7463 uint8x8_t __ret; 7464 __ret = (uint8x8_t)(__p0 <= __p1); 7465 return __ret; 7466 } 7467 #else 7468 __ai __attribute__((target("neon"))) uint8x8_t vcle_s8(int8x8_t __p0, int8x8_t __p1) { 7469 uint8x8_t __ret; 7470 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7471 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7472 __ret = (uint8x8_t)(__rev0 <= __rev1); 7473 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7474 return __ret; 7475 } 7476 #endif 7477 7478 #ifdef __LITTLE_ENDIAN__ 7479 __ai __attribute__((target("neon"))) uint32x2_t vcle_f32(float32x2_t __p0, float32x2_t __p1) { 7480 uint32x2_t __ret; 7481 __ret = (uint32x2_t)(__p0 <= __p1); 7482 return __ret; 7483 } 7484 #else 7485 __ai __attribute__((target("neon"))) uint32x2_t vcle_f32(float32x2_t __p0, float32x2_t __p1) { 7486 uint32x2_t __ret; 7487 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7488 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7489 __ret = (uint32x2_t)(__rev0 <= __rev1); 7490 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7491 return __ret; 7492 } 7493 #endif 7494 7495 #ifdef __LITTLE_ENDIAN__ 7496 __ai __attribute__((target("neon"))) uint32x2_t vcle_s32(int32x2_t __p0, int32x2_t __p1) { 7497 uint32x2_t __ret; 7498 __ret = (uint32x2_t)(__p0 <= __p1); 7499 return 
__ret; 7500 } 7501 #else 7502 __ai __attribute__((target("neon"))) uint32x2_t vcle_s32(int32x2_t __p0, int32x2_t __p1) { 7503 uint32x2_t __ret; 7504 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7505 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7506 __ret = (uint32x2_t)(__rev0 <= __rev1); 7507 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7508 return __ret; 7509 } 7510 #endif 7511 7512 #ifdef __LITTLE_ENDIAN__ 7513 __ai __attribute__((target("neon"))) uint16x4_t vcle_s16(int16x4_t __p0, int16x4_t __p1) { 7514 uint16x4_t __ret; 7515 __ret = (uint16x4_t)(__p0 <= __p1); 7516 return __ret; 7517 } 7518 #else 7519 __ai __attribute__((target("neon"))) uint16x4_t vcle_s16(int16x4_t __p0, int16x4_t __p1) { 7520 uint16x4_t __ret; 7521 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7522 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7523 __ret = (uint16x4_t)(__rev0 <= __rev1); 7524 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7525 return __ret; 7526 } 7527 #endif 7528 7529 #ifdef __LITTLE_ENDIAN__ 7530 __ai __attribute__((target("neon"))) int8x16_t vclsq_u8(uint8x16_t __p0) { 7531 int8x16_t __ret; 7532 __ret = (int8x16_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 32); 7533 return __ret; 7534 } 7535 #else 7536 __ai __attribute__((target("neon"))) int8x16_t vclsq_u8(uint8x16_t __p0) { 7537 int8x16_t __ret; 7538 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7539 __ret = (int8x16_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 32); 7540 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7541 return __ret; 7542 } 7543 #endif 7544 7545 #ifdef __LITTLE_ENDIAN__ 7546 __ai __attribute__((target("neon"))) int32x4_t vclsq_u32(uint32x4_t __p0) { 7547 int32x4_t __ret; 7548 __ret = (int32x4_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 34); 7549 
return __ret; 7550 } 7551 #else 7552 __ai __attribute__((target("neon"))) int32x4_t vclsq_u32(uint32x4_t __p0) { 7553 int32x4_t __ret; 7554 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7555 __ret = (int32x4_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 34); 7556 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7557 return __ret; 7558 } 7559 #endif 7560 7561 #ifdef __LITTLE_ENDIAN__ 7562 __ai __attribute__((target("neon"))) int16x8_t vclsq_u16(uint16x8_t __p0) { 7563 int16x8_t __ret; 7564 __ret = (int16x8_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 33); 7565 return __ret; 7566 } 7567 #else 7568 __ai __attribute__((target("neon"))) int16x8_t vclsq_u16(uint16x8_t __p0) { 7569 int16x8_t __ret; 7570 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7571 __ret = (int16x8_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 33); 7572 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7573 return __ret; 7574 } 7575 #endif 7576 7577 #ifdef __LITTLE_ENDIAN__ 7578 __ai __attribute__((target("neon"))) int8x16_t vclsq_s8(int8x16_t __p0) { 7579 int8x16_t __ret; 7580 __ret = (int8x16_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 32); 7581 return __ret; 7582 } 7583 #else 7584 __ai __attribute__((target("neon"))) int8x16_t vclsq_s8(int8x16_t __p0) { 7585 int8x16_t __ret; 7586 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7587 __ret = (int8x16_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 32); 7588 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7589 return __ret; 7590 } 7591 #endif 7592 7593 #ifdef __LITTLE_ENDIAN__ 7594 __ai __attribute__((target("neon"))) int32x4_t vclsq_s32(int32x4_t __p0) { 7595 int32x4_t __ret; 7596 __ret = (int32x4_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 34); 7597 return __ret; 7598 } 7599 #else 7600 __ai __attribute__((target("neon"))) int32x4_t 
vclsq_s32(int32x4_t __p0) { 7601 int32x4_t __ret; 7602 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7603 __ret = (int32x4_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 34); 7604 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7605 return __ret; 7606 } 7607 #endif 7608 7609 #ifdef __LITTLE_ENDIAN__ 7610 __ai __attribute__((target("neon"))) int16x8_t vclsq_s16(int16x8_t __p0) { 7611 int16x8_t __ret; 7612 __ret = (int16x8_t) __builtin_neon_vclsq_v((int8x16_t)__p0, 33); 7613 return __ret; 7614 } 7615 #else 7616 __ai __attribute__((target("neon"))) int16x8_t vclsq_s16(int16x8_t __p0) { 7617 int16x8_t __ret; 7618 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7619 __ret = (int16x8_t) __builtin_neon_vclsq_v((int8x16_t)__rev0, 33); 7620 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7621 return __ret; 7622 } 7623 #endif 7624 7625 #ifdef __LITTLE_ENDIAN__ 7626 __ai __attribute__((target("neon"))) int8x8_t vcls_u8(uint8x8_t __p0) { 7627 int8x8_t __ret; 7628 __ret = (int8x8_t) __builtin_neon_vcls_v((int8x8_t)__p0, 0); 7629 return __ret; 7630 } 7631 #else 7632 __ai __attribute__((target("neon"))) int8x8_t vcls_u8(uint8x8_t __p0) { 7633 int8x8_t __ret; 7634 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7635 __ret = (int8x8_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 0); 7636 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7637 return __ret; 7638 } 7639 #endif 7640 7641 #ifdef __LITTLE_ENDIAN__ 7642 __ai __attribute__((target("neon"))) int32x2_t vcls_u32(uint32x2_t __p0) { 7643 int32x2_t __ret; 7644 __ret = (int32x2_t) __builtin_neon_vcls_v((int8x8_t)__p0, 2); 7645 return __ret; 7646 } 7647 #else 7648 __ai __attribute__((target("neon"))) int32x2_t vcls_u32(uint32x2_t __p0) { 7649 int32x2_t __ret; 7650 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7651 __ret = (int32x2_t) 
__builtin_neon_vcls_v((int8x8_t)__rev0, 2); 7652 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7653 return __ret; 7654 } 7655 #endif 7656 7657 #ifdef __LITTLE_ENDIAN__ 7658 __ai __attribute__((target("neon"))) int16x4_t vcls_u16(uint16x4_t __p0) { 7659 int16x4_t __ret; 7660 __ret = (int16x4_t) __builtin_neon_vcls_v((int8x8_t)__p0, 1); 7661 return __ret; 7662 } 7663 #else 7664 __ai __attribute__((target("neon"))) int16x4_t vcls_u16(uint16x4_t __p0) { 7665 int16x4_t __ret; 7666 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7667 __ret = (int16x4_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 1); 7668 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7669 return __ret; 7670 } 7671 #endif 7672 7673 #ifdef __LITTLE_ENDIAN__ 7674 __ai __attribute__((target("neon"))) int8x8_t vcls_s8(int8x8_t __p0) { 7675 int8x8_t __ret; 7676 __ret = (int8x8_t) __builtin_neon_vcls_v((int8x8_t)__p0, 0); 7677 return __ret; 7678 } 7679 #else 7680 __ai __attribute__((target("neon"))) int8x8_t vcls_s8(int8x8_t __p0) { 7681 int8x8_t __ret; 7682 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7683 __ret = (int8x8_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 0); 7684 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7685 return __ret; 7686 } 7687 #endif 7688 7689 #ifdef __LITTLE_ENDIAN__ 7690 __ai __attribute__((target("neon"))) int32x2_t vcls_s32(int32x2_t __p0) { 7691 int32x2_t __ret; 7692 __ret = (int32x2_t) __builtin_neon_vcls_v((int8x8_t)__p0, 2); 7693 return __ret; 7694 } 7695 #else 7696 __ai __attribute__((target("neon"))) int32x2_t vcls_s32(int32x2_t __p0) { 7697 int32x2_t __ret; 7698 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7699 __ret = (int32x2_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 2); 7700 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7701 return __ret; 7702 } 7703 #endif 7704 7705 #ifdef __LITTLE_ENDIAN__ 7706 __ai __attribute__((target("neon"))) 
int16x4_t vcls_s16(int16x4_t __p0) { 7707 int16x4_t __ret; 7708 __ret = (int16x4_t) __builtin_neon_vcls_v((int8x8_t)__p0, 1); 7709 return __ret; 7710 } 7711 #else 7712 __ai __attribute__((target("neon"))) int16x4_t vcls_s16(int16x4_t __p0) { 7713 int16x4_t __ret; 7714 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7715 __ret = (int16x4_t) __builtin_neon_vcls_v((int8x8_t)__rev0, 1); 7716 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7717 return __ret; 7718 } 7719 #endif 7720 7721 #ifdef __LITTLE_ENDIAN__ 7722 __ai __attribute__((target("neon"))) uint8x16_t vcltq_u8(uint8x16_t __p0, uint8x16_t __p1) { 7723 uint8x16_t __ret; 7724 __ret = (uint8x16_t)(__p0 < __p1); 7725 return __ret; 7726 } 7727 #else 7728 __ai __attribute__((target("neon"))) uint8x16_t vcltq_u8(uint8x16_t __p0, uint8x16_t __p1) { 7729 uint8x16_t __ret; 7730 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7731 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7732 __ret = (uint8x16_t)(__rev0 < __rev1); 7733 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7734 return __ret; 7735 } 7736 #endif 7737 7738 #ifdef __LITTLE_ENDIAN__ 7739 __ai __attribute__((target("neon"))) uint32x4_t vcltq_u32(uint32x4_t __p0, uint32x4_t __p1) { 7740 uint32x4_t __ret; 7741 __ret = (uint32x4_t)(__p0 < __p1); 7742 return __ret; 7743 } 7744 #else 7745 __ai __attribute__((target("neon"))) uint32x4_t vcltq_u32(uint32x4_t __p0, uint32x4_t __p1) { 7746 uint32x4_t __ret; 7747 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7748 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7749 __ret = (uint32x4_t)(__rev0 < __rev1); 7750 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7751 return __ret; 7752 } 7753 #endif 7754 7755 #ifdef 
__LITTLE_ENDIAN__ 7756 __ai __attribute__((target("neon"))) uint16x8_t vcltq_u16(uint16x8_t __p0, uint16x8_t __p1) { 7757 uint16x8_t __ret; 7758 __ret = (uint16x8_t)(__p0 < __p1); 7759 return __ret; 7760 } 7761 #else 7762 __ai __attribute__((target("neon"))) uint16x8_t vcltq_u16(uint16x8_t __p0, uint16x8_t __p1) { 7763 uint16x8_t __ret; 7764 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7765 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7766 __ret = (uint16x8_t)(__rev0 < __rev1); 7767 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7768 return __ret; 7769 } 7770 #endif 7771 7772 #ifdef __LITTLE_ENDIAN__ 7773 __ai __attribute__((target("neon"))) uint8x16_t vcltq_s8(int8x16_t __p0, int8x16_t __p1) { 7774 uint8x16_t __ret; 7775 __ret = (uint8x16_t)(__p0 < __p1); 7776 return __ret; 7777 } 7778 #else 7779 __ai __attribute__((target("neon"))) uint8x16_t vcltq_s8(int8x16_t __p0, int8x16_t __p1) { 7780 uint8x16_t __ret; 7781 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7782 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7783 __ret = (uint8x16_t)(__rev0 < __rev1); 7784 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7785 return __ret; 7786 } 7787 #endif 7788 7789 #ifdef __LITTLE_ENDIAN__ 7790 __ai __attribute__((target("neon"))) uint32x4_t vcltq_f32(float32x4_t __p0, float32x4_t __p1) { 7791 uint32x4_t __ret; 7792 __ret = (uint32x4_t)(__p0 < __p1); 7793 return __ret; 7794 } 7795 #else 7796 __ai __attribute__((target("neon"))) uint32x4_t vcltq_f32(float32x4_t __p0, float32x4_t __p1) { 7797 uint32x4_t __ret; 7798 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7799 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7800 
__ret = (uint32x4_t)(__rev0 < __rev1); 7801 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7802 return __ret; 7803 } 7804 #endif 7805 7806 #ifdef __LITTLE_ENDIAN__ 7807 __ai __attribute__((target("neon"))) uint32x4_t vcltq_s32(int32x4_t __p0, int32x4_t __p1) { 7808 uint32x4_t __ret; 7809 __ret = (uint32x4_t)(__p0 < __p1); 7810 return __ret; 7811 } 7812 #else 7813 __ai __attribute__((target("neon"))) uint32x4_t vcltq_s32(int32x4_t __p0, int32x4_t __p1) { 7814 uint32x4_t __ret; 7815 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7816 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7817 __ret = (uint32x4_t)(__rev0 < __rev1); 7818 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7819 return __ret; 7820 } 7821 #endif 7822 7823 #ifdef __LITTLE_ENDIAN__ 7824 __ai __attribute__((target("neon"))) uint16x8_t vcltq_s16(int16x8_t __p0, int16x8_t __p1) { 7825 uint16x8_t __ret; 7826 __ret = (uint16x8_t)(__p0 < __p1); 7827 return __ret; 7828 } 7829 #else 7830 __ai __attribute__((target("neon"))) uint16x8_t vcltq_s16(int16x8_t __p0, int16x8_t __p1) { 7831 uint16x8_t __ret; 7832 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7833 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 7834 __ret = (uint16x8_t)(__rev0 < __rev1); 7835 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7836 return __ret; 7837 } 7838 #endif 7839 7840 #ifdef __LITTLE_ENDIAN__ 7841 __ai __attribute__((target("neon"))) uint8x8_t vclt_u8(uint8x8_t __p0, uint8x8_t __p1) { 7842 uint8x8_t __ret; 7843 __ret = (uint8x8_t)(__p0 < __p1); 7844 return __ret; 7845 } 7846 #else 7847 __ai __attribute__((target("neon"))) uint8x8_t vclt_u8(uint8x8_t __p0, uint8x8_t __p1) { 7848 uint8x8_t __ret; 7849 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7850 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, 
__p1, 7, 6, 5, 4, 3, 2, 1, 0); 7851 __ret = (uint8x8_t)(__rev0 < __rev1); 7852 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7853 return __ret; 7854 } 7855 #endif 7856 7857 #ifdef __LITTLE_ENDIAN__ 7858 __ai __attribute__((target("neon"))) uint32x2_t vclt_u32(uint32x2_t __p0, uint32x2_t __p1) { 7859 uint32x2_t __ret; 7860 __ret = (uint32x2_t)(__p0 < __p1); 7861 return __ret; 7862 } 7863 #else 7864 __ai __attribute__((target("neon"))) uint32x2_t vclt_u32(uint32x2_t __p0, uint32x2_t __p1) { 7865 uint32x2_t __ret; 7866 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7867 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7868 __ret = (uint32x2_t)(__rev0 < __rev1); 7869 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7870 return __ret; 7871 } 7872 #endif 7873 7874 #ifdef __LITTLE_ENDIAN__ 7875 __ai __attribute__((target("neon"))) uint16x4_t vclt_u16(uint16x4_t __p0, uint16x4_t __p1) { 7876 uint16x4_t __ret; 7877 __ret = (uint16x4_t)(__p0 < __p1); 7878 return __ret; 7879 } 7880 #else 7881 __ai __attribute__((target("neon"))) uint16x4_t vclt_u16(uint16x4_t __p0, uint16x4_t __p1) { 7882 uint16x4_t __ret; 7883 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7884 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7885 __ret = (uint16x4_t)(__rev0 < __rev1); 7886 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7887 return __ret; 7888 } 7889 #endif 7890 7891 #ifdef __LITTLE_ENDIAN__ 7892 __ai __attribute__((target("neon"))) uint8x8_t vclt_s8(int8x8_t __p0, int8x8_t __p1) { 7893 uint8x8_t __ret; 7894 __ret = (uint8x8_t)(__p0 < __p1); 7895 return __ret; 7896 } 7897 #else 7898 __ai __attribute__((target("neon"))) uint8x8_t vclt_s8(int8x8_t __p0, int8x8_t __p1) { 7899 uint8x8_t __ret; 7900 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 7901 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 
6, 5, 4, 3, 2, 1, 0); 7902 __ret = (uint8x8_t)(__rev0 < __rev1); 7903 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 7904 return __ret; 7905 } 7906 #endif 7907 7908 #ifdef __LITTLE_ENDIAN__ 7909 __ai __attribute__((target("neon"))) uint32x2_t vclt_f32(float32x2_t __p0, float32x2_t __p1) { 7910 uint32x2_t __ret; 7911 __ret = (uint32x2_t)(__p0 < __p1); 7912 return __ret; 7913 } 7914 #else 7915 __ai __attribute__((target("neon"))) uint32x2_t vclt_f32(float32x2_t __p0, float32x2_t __p1) { 7916 uint32x2_t __ret; 7917 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7918 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7919 __ret = (uint32x2_t)(__rev0 < __rev1); 7920 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7921 return __ret; 7922 } 7923 #endif 7924 7925 #ifdef __LITTLE_ENDIAN__ 7926 __ai __attribute__((target("neon"))) uint32x2_t vclt_s32(int32x2_t __p0, int32x2_t __p1) { 7927 uint32x2_t __ret; 7928 __ret = (uint32x2_t)(__p0 < __p1); 7929 return __ret; 7930 } 7931 #else 7932 __ai __attribute__((target("neon"))) uint32x2_t vclt_s32(int32x2_t __p0, int32x2_t __p1) { 7933 uint32x2_t __ret; 7934 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 7935 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 7936 __ret = (uint32x2_t)(__rev0 < __rev1); 7937 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 7938 return __ret; 7939 } 7940 #endif 7941 7942 #ifdef __LITTLE_ENDIAN__ 7943 __ai __attribute__((target("neon"))) uint16x4_t vclt_s16(int16x4_t __p0, int16x4_t __p1) { 7944 uint16x4_t __ret; 7945 __ret = (uint16x4_t)(__p0 < __p1); 7946 return __ret; 7947 } 7948 #else 7949 __ai __attribute__((target("neon"))) uint16x4_t vclt_s16(int16x4_t __p0, int16x4_t __p1) { 7950 uint16x4_t __ret; 7951 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7952 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 7953 __ret = 
(uint16x4_t)(__rev0 < __rev1); 7954 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7955 return __ret; 7956 } 7957 #endif 7958 7959 #ifdef __LITTLE_ENDIAN__ 7960 __ai __attribute__((target("neon"))) uint8x16_t vclzq_u8(uint8x16_t __p0) { 7961 uint8x16_t __ret; 7962 __ret = (uint8x16_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 48); 7963 return __ret; 7964 } 7965 #else 7966 __ai __attribute__((target("neon"))) uint8x16_t vclzq_u8(uint8x16_t __p0) { 7967 uint8x16_t __ret; 7968 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7969 __ret = (uint8x16_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 48); 7970 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 7971 return __ret; 7972 } 7973 #endif 7974 7975 #ifdef __LITTLE_ENDIAN__ 7976 __ai __attribute__((target("neon"))) uint32x4_t vclzq_u32(uint32x4_t __p0) { 7977 uint32x4_t __ret; 7978 __ret = (uint32x4_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 50); 7979 return __ret; 7980 } 7981 #else 7982 __ai __attribute__((target("neon"))) uint32x4_t vclzq_u32(uint32x4_t __p0) { 7983 uint32x4_t __ret; 7984 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 7985 __ret = (uint32x4_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 50); 7986 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 7987 return __ret; 7988 } 7989 #endif 7990 7991 #ifdef __LITTLE_ENDIAN__ 7992 __ai __attribute__((target("neon"))) uint16x8_t vclzq_u16(uint16x8_t __p0) { 7993 uint16x8_t __ret; 7994 __ret = (uint16x8_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 49); 7995 return __ret; 7996 } 7997 #else 7998 __ai __attribute__((target("neon"))) uint16x8_t vclzq_u16(uint16x8_t __p0) { 7999 uint16x8_t __ret; 8000 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 8001 __ret = (uint16x8_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 49); 8002 __ret = __builtin_shufflevector(__ret, 
__ret, 7, 6, 5, 4, 3, 2, 1, 0); 8003 return __ret; 8004 } 8005 #endif 8006 8007 #ifdef __LITTLE_ENDIAN__ 8008 __ai __attribute__((target("neon"))) int8x16_t vclzq_s8(int8x16_t __p0) { 8009 int8x16_t __ret; 8010 __ret = (int8x16_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 32); 8011 return __ret; 8012 } 8013 #else 8014 __ai __attribute__((target("neon"))) int8x16_t vclzq_s8(int8x16_t __p0) { 8015 int8x16_t __ret; 8016 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8017 __ret = (int8x16_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 32); 8018 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8019 return __ret; 8020 } 8021 #endif 8022 8023 #ifdef __LITTLE_ENDIAN__ 8024 __ai __attribute__((target("neon"))) int32x4_t vclzq_s32(int32x4_t __p0) { 8025 int32x4_t __ret; 8026 __ret = (int32x4_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 34); 8027 return __ret; 8028 } 8029 #else 8030 __ai __attribute__((target("neon"))) int32x4_t vclzq_s32(int32x4_t __p0) { 8031 int32x4_t __ret; 8032 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8033 __ret = (int32x4_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 34); 8034 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8035 return __ret; 8036 } 8037 #endif 8038 8039 #ifdef __LITTLE_ENDIAN__ 8040 __ai __attribute__((target("neon"))) int16x8_t vclzq_s16(int16x8_t __p0) { 8041 int16x8_t __ret; 8042 __ret = (int16x8_t) __builtin_neon_vclzq_v((int8x16_t)__p0, 33); 8043 return __ret; 8044 } 8045 #else 8046 __ai __attribute__((target("neon"))) int16x8_t vclzq_s16(int16x8_t __p0) { 8047 int16x8_t __ret; 8048 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 8049 __ret = (int16x8_t) __builtin_neon_vclzq_v((int8x16_t)__rev0, 33); 8050 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8051 return __ret; 8052 } 8053 #endif 8054 8055 #ifdef 
__LITTLE_ENDIAN__ 8056 __ai __attribute__((target("neon"))) uint8x8_t vclz_u8(uint8x8_t __p0) { 8057 uint8x8_t __ret; 8058 __ret = (uint8x8_t) __builtin_neon_vclz_v((int8x8_t)__p0, 16); 8059 return __ret; 8060 } 8061 #else 8062 __ai __attribute__((target("neon"))) uint8x8_t vclz_u8(uint8x8_t __p0) { 8063 uint8x8_t __ret; 8064 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 8065 __ret = (uint8x8_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 16); 8066 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8067 return __ret; 8068 } 8069 #endif 8070 8071 #ifdef __LITTLE_ENDIAN__ 8072 __ai __attribute__((target("neon"))) uint32x2_t vclz_u32(uint32x2_t __p0) { 8073 uint32x2_t __ret; 8074 __ret = (uint32x2_t) __builtin_neon_vclz_v((int8x8_t)__p0, 18); 8075 return __ret; 8076 } 8077 #else 8078 __ai __attribute__((target("neon"))) uint32x2_t vclz_u32(uint32x2_t __p0) { 8079 uint32x2_t __ret; 8080 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8081 __ret = (uint32x2_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 18); 8082 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 8083 return __ret; 8084 } 8085 #endif 8086 8087 #ifdef __LITTLE_ENDIAN__ 8088 __ai __attribute__((target("neon"))) uint16x4_t vclz_u16(uint16x4_t __p0) { 8089 uint16x4_t __ret; 8090 __ret = (uint16x4_t) __builtin_neon_vclz_v((int8x8_t)__p0, 17); 8091 return __ret; 8092 } 8093 #else 8094 __ai __attribute__((target("neon"))) uint16x4_t vclz_u16(uint16x4_t __p0) { 8095 uint16x4_t __ret; 8096 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8097 __ret = (uint16x4_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 17); 8098 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8099 return __ret; 8100 } 8101 #endif 8102 8103 #ifdef __LITTLE_ENDIAN__ 8104 __ai __attribute__((target("neon"))) int8x8_t vclz_s8(int8x8_t __p0) { 8105 int8x8_t __ret; 8106 __ret = (int8x8_t) __builtin_neon_vclz_v((int8x8_t)__p0, 0); 8107 
return __ret; 8108 } 8109 #else 8110 __ai __attribute__((target("neon"))) int8x8_t vclz_s8(int8x8_t __p0) { 8111 int8x8_t __ret; 8112 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 8113 __ret = (int8x8_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 0); 8114 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8115 return __ret; 8116 } 8117 #endif 8118 8119 #ifdef __LITTLE_ENDIAN__ 8120 __ai __attribute__((target("neon"))) int32x2_t vclz_s32(int32x2_t __p0) { 8121 int32x2_t __ret; 8122 __ret = (int32x2_t) __builtin_neon_vclz_v((int8x8_t)__p0, 2); 8123 return __ret; 8124 } 8125 #else 8126 __ai __attribute__((target("neon"))) int32x2_t vclz_s32(int32x2_t __p0) { 8127 int32x2_t __ret; 8128 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8129 __ret = (int32x2_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 2); 8130 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 8131 return __ret; 8132 } 8133 #endif 8134 8135 #ifdef __LITTLE_ENDIAN__ 8136 __ai __attribute__((target("neon"))) int16x4_t vclz_s16(int16x4_t __p0) { 8137 int16x4_t __ret; 8138 __ret = (int16x4_t) __builtin_neon_vclz_v((int8x8_t)__p0, 1); 8139 return __ret; 8140 } 8141 #else 8142 __ai __attribute__((target("neon"))) int16x4_t vclz_s16(int16x4_t __p0) { 8143 int16x4_t __ret; 8144 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8145 __ret = (int16x4_t) __builtin_neon_vclz_v((int8x8_t)__rev0, 1); 8146 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8147 return __ret; 8148 } 8149 #endif 8150 8151 #ifdef __LITTLE_ENDIAN__ 8152 __ai __attribute__((target("neon"))) poly8x8_t vcnt_p8(poly8x8_t __p0) { 8153 poly8x8_t __ret; 8154 __ret = (poly8x8_t) __builtin_neon_vcnt_v((int8x8_t)__p0, 4); 8155 return __ret; 8156 } 8157 #else 8158 __ai __attribute__((target("neon"))) poly8x8_t vcnt_p8(poly8x8_t __p0) { 8159 poly8x8_t __ret; 8160 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 
2, 1, 0); 8161 __ret = (poly8x8_t) __builtin_neon_vcnt_v((int8x8_t)__rev0, 4); 8162 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8163 return __ret; 8164 } 8165 #endif 8166 8167 #ifdef __LITTLE_ENDIAN__ 8168 __ai __attribute__((target("neon"))) poly8x16_t vcntq_p8(poly8x16_t __p0) { 8169 poly8x16_t __ret; 8170 __ret = (poly8x16_t) __builtin_neon_vcntq_v((int8x16_t)__p0, 36); 8171 return __ret; 8172 } 8173 #else 8174 __ai __attribute__((target("neon"))) poly8x16_t vcntq_p8(poly8x16_t __p0) { 8175 poly8x16_t __ret; 8176 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8177 __ret = (poly8x16_t) __builtin_neon_vcntq_v((int8x16_t)__rev0, 36); 8178 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8179 return __ret; 8180 } 8181 #endif 8182 8183 #ifdef __LITTLE_ENDIAN__ 8184 __ai __attribute__((target("neon"))) uint8x16_t vcntq_u8(uint8x16_t __p0) { 8185 uint8x16_t __ret; 8186 __ret = (uint8x16_t) __builtin_neon_vcntq_v((int8x16_t)__p0, 48); 8187 return __ret; 8188 } 8189 #else 8190 __ai __attribute__((target("neon"))) uint8x16_t vcntq_u8(uint8x16_t __p0) { 8191 uint8x16_t __ret; 8192 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8193 __ret = (uint8x16_t) __builtin_neon_vcntq_v((int8x16_t)__rev0, 48); 8194 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8195 return __ret; 8196 } 8197 #endif 8198 8199 #ifdef __LITTLE_ENDIAN__ 8200 __ai __attribute__((target("neon"))) int8x16_t vcntq_s8(int8x16_t __p0) { 8201 int8x16_t __ret; 8202 __ret = (int8x16_t) __builtin_neon_vcntq_v((int8x16_t)__p0, 32); 8203 return __ret; 8204 } 8205 #else 8206 __ai __attribute__((target("neon"))) int8x16_t vcntq_s8(int8x16_t __p0) { 8207 int8x16_t __ret; 8208 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 
13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8209 __ret = (int8x16_t) __builtin_neon_vcntq_v((int8x16_t)__rev0, 32); 8210 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8211 return __ret; 8212 } 8213 #endif 8214 8215 #ifdef __LITTLE_ENDIAN__ 8216 __ai __attribute__((target("neon"))) uint8x8_t vcnt_u8(uint8x8_t __p0) { 8217 uint8x8_t __ret; 8218 __ret = (uint8x8_t) __builtin_neon_vcnt_v((int8x8_t)__p0, 16); 8219 return __ret; 8220 } 8221 #else 8222 __ai __attribute__((target("neon"))) uint8x8_t vcnt_u8(uint8x8_t __p0) { 8223 uint8x8_t __ret; 8224 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 8225 __ret = (uint8x8_t) __builtin_neon_vcnt_v((int8x8_t)__rev0, 16); 8226 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8227 return __ret; 8228 } 8229 #endif 8230 8231 #ifdef __LITTLE_ENDIAN__ 8232 __ai __attribute__((target("neon"))) int8x8_t vcnt_s8(int8x8_t __p0) { 8233 int8x8_t __ret; 8234 __ret = (int8x8_t) __builtin_neon_vcnt_v((int8x8_t)__p0, 0); 8235 return __ret; 8236 } 8237 #else 8238 __ai __attribute__((target("neon"))) int8x8_t vcnt_s8(int8x8_t __p0) { 8239 int8x8_t __ret; 8240 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 8241 __ret = (int8x8_t) __builtin_neon_vcnt_v((int8x8_t)__rev0, 0); 8242 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8243 return __ret; 8244 } 8245 #endif 8246 8247 #ifdef __LITTLE_ENDIAN__ 8248 __ai __attribute__((target("neon"))) poly8x16_t vcombine_p8(poly8x8_t __p0, poly8x8_t __p1) { 8249 poly8x16_t __ret; 8250 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); 8251 return __ret; 8252 } 8253 #else 8254 __ai __attribute__((target("neon"))) poly8x16_t vcombine_p8(poly8x8_t __p0, poly8x8_t __p1) { 8255 poly8x16_t __ret; 8256 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 
8257 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 8258 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); 8259 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8260 return __ret; 8261 } 8262 #endif 8263 8264 #ifdef __LITTLE_ENDIAN__ 8265 __ai __attribute__((target("neon"))) poly16x8_t vcombine_p16(poly16x4_t __p0, poly16x4_t __p1) { 8266 poly16x8_t __ret; 8267 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 8268 return __ret; 8269 } 8270 #else 8271 __ai __attribute__((target("neon"))) poly16x8_t vcombine_p16(poly16x4_t __p0, poly16x4_t __p1) { 8272 poly16x8_t __ret; 8273 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8274 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 8275 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7); 8276 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8277 return __ret; 8278 } 8279 #endif 8280 8281 #ifdef __LITTLE_ENDIAN__ 8282 __ai __attribute__((target("neon"))) uint8x16_t vcombine_u8(uint8x8_t __p0, uint8x8_t __p1) { 8283 uint8x16_t __ret; 8284 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); 8285 return __ret; 8286 } 8287 #else 8288 __ai __attribute__((target("neon"))) uint8x16_t vcombine_u8(uint8x8_t __p0, uint8x8_t __p1) { 8289 uint8x16_t __ret; 8290 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 8291 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 8292 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); 8293 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8294 return __ret; 8295 } 8296 __ai __attribute__((target("neon"))) uint8x16_t 
__noswap_vcombine_u8(uint8x8_t __p0, uint8x8_t __p1) { 8297 uint8x16_t __ret; 8298 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); 8299 return __ret; 8300 } 8301 #endif 8302 8303 #ifdef __LITTLE_ENDIAN__ 8304 __ai __attribute__((target("neon"))) uint32x4_t vcombine_u32(uint32x2_t __p0, uint32x2_t __p1) { 8305 uint32x4_t __ret; 8306 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3); 8307 return __ret; 8308 } 8309 #else 8310 __ai __attribute__((target("neon"))) uint32x4_t vcombine_u32(uint32x2_t __p0, uint32x2_t __p1) { 8311 uint32x4_t __ret; 8312 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8313 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 8314 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3); 8315 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8316 return __ret; 8317 } 8318 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vcombine_u32(uint32x2_t __p0, uint32x2_t __p1) { 8319 uint32x4_t __ret; 8320 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3); 8321 return __ret; 8322 } 8323 #endif 8324 8325 #ifdef __LITTLE_ENDIAN__ 8326 __ai __attribute__((target("neon"))) uint64x2_t vcombine_u64(uint64x1_t __p0, uint64x1_t __p1) { 8327 uint64x2_t __ret; 8328 __ret = __builtin_shufflevector(__p0, __p1, 0, 1); 8329 return __ret; 8330 } 8331 #else 8332 __ai __attribute__((target("neon"))) uint64x2_t vcombine_u64(uint64x1_t __p0, uint64x1_t __p1) { 8333 uint64x2_t __ret; 8334 __ret = __builtin_shufflevector(__p0, __p1, 0, 1); 8335 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 8336 return __ret; 8337 } 8338 #endif 8339 8340 #ifdef __LITTLE_ENDIAN__ 8341 __ai __attribute__((target("neon"))) uint16x8_t vcombine_u16(uint16x4_t __p0, uint16x4_t __p1) { 8342 uint16x8_t __ret; 8343 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 8344 return __ret; 8345 } 8346 #else 8347 __ai __attribute__((target("neon"))) uint16x8_t 
vcombine_u16(uint16x4_t __p0, uint16x4_t __p1) { 8348 uint16x8_t __ret; 8349 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8350 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 8351 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7); 8352 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8353 return __ret; 8354 } 8355 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vcombine_u16(uint16x4_t __p0, uint16x4_t __p1) { 8356 uint16x8_t __ret; 8357 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 8358 return __ret; 8359 } 8360 #endif 8361 8362 #ifdef __LITTLE_ENDIAN__ 8363 __ai __attribute__((target("neon"))) int8x16_t vcombine_s8(int8x8_t __p0, int8x8_t __p1) { 8364 int8x16_t __ret; 8365 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); 8366 return __ret; 8367 } 8368 #else 8369 __ai __attribute__((target("neon"))) int8x16_t vcombine_s8(int8x8_t __p0, int8x8_t __p1) { 8370 int8x16_t __ret; 8371 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 8372 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 8373 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); 8374 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 8375 return __ret; 8376 } 8377 __ai __attribute__((target("neon"))) int8x16_t __noswap_vcombine_s8(int8x8_t __p0, int8x8_t __p1) { 8378 int8x16_t __ret; 8379 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15); 8380 return __ret; 8381 } 8382 #endif 8383 8384 #ifdef __LITTLE_ENDIAN__ 8385 __ai __attribute__((target("neon"))) float32x4_t vcombine_f32(float32x2_t __p0, float32x2_t __p1) { 8386 float32x4_t __ret; 8387 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3); 8388 
return __ret; 8389 } 8390 #else 8391 __ai __attribute__((target("neon"))) float32x4_t vcombine_f32(float32x2_t __p0, float32x2_t __p1) { 8392 float32x4_t __ret; 8393 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8394 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 8395 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3); 8396 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8397 return __ret; 8398 } 8399 __ai __attribute__((target("neon"))) float32x4_t __noswap_vcombine_f32(float32x2_t __p0, float32x2_t __p1) { 8400 float32x4_t __ret; 8401 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3); 8402 return __ret; 8403 } 8404 #endif 8405 8406 #ifdef __LITTLE_ENDIAN__ 8407 __ai __attribute__((target("neon"))) float16x8_t vcombine_f16(float16x4_t __p0, float16x4_t __p1) { 8408 float16x8_t __ret; 8409 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 8410 return __ret; 8411 } 8412 #else 8413 __ai __attribute__((target("neon"))) float16x8_t vcombine_f16(float16x4_t __p0, float16x4_t __p1) { 8414 float16x8_t __ret; 8415 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8416 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 8417 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7); 8418 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8419 return __ret; 8420 } 8421 __ai __attribute__((target("neon"))) float16x8_t __noswap_vcombine_f16(float16x4_t __p0, float16x4_t __p1) { 8422 float16x8_t __ret; 8423 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 8424 return __ret; 8425 } 8426 #endif 8427 8428 #ifdef __LITTLE_ENDIAN__ 8429 __ai __attribute__((target("neon"))) int32x4_t vcombine_s32(int32x2_t __p0, int32x2_t __p1) { 8430 int32x4_t __ret; 8431 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3); 8432 return __ret; 8433 } 8434 #else 8435 __ai 
__attribute__((target("neon"))) int32x4_t vcombine_s32(int32x2_t __p0, int32x2_t __p1) { 8436 int32x4_t __ret; 8437 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8438 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 8439 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3); 8440 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8441 return __ret; 8442 } 8443 __ai __attribute__((target("neon"))) int32x4_t __noswap_vcombine_s32(int32x2_t __p0, int32x2_t __p1) { 8444 int32x4_t __ret; 8445 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3); 8446 return __ret; 8447 } 8448 #endif 8449 8450 #ifdef __LITTLE_ENDIAN__ 8451 __ai __attribute__((target("neon"))) int64x2_t vcombine_s64(int64x1_t __p0, int64x1_t __p1) { 8452 int64x2_t __ret; 8453 __ret = __builtin_shufflevector(__p0, __p1, 0, 1); 8454 return __ret; 8455 } 8456 #else 8457 __ai __attribute__((target("neon"))) int64x2_t vcombine_s64(int64x1_t __p0, int64x1_t __p1) { 8458 int64x2_t __ret; 8459 __ret = __builtin_shufflevector(__p0, __p1, 0, 1); 8460 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 8461 return __ret; 8462 } 8463 #endif 8464 8465 #ifdef __LITTLE_ENDIAN__ 8466 __ai __attribute__((target("neon"))) int16x8_t vcombine_s16(int16x4_t __p0, int16x4_t __p1) { 8467 int16x8_t __ret; 8468 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 8469 return __ret; 8470 } 8471 #else 8472 __ai __attribute__((target("neon"))) int16x8_t vcombine_s16(int16x4_t __p0, int16x4_t __p1) { 8473 int16x8_t __ret; 8474 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8475 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 8476 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 1, 2, 3, 4, 5, 6, 7); 8477 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 8478 return __ret; 8479 } 8480 __ai __attribute__((target("neon"))) int16x8_t __noswap_vcombine_s16(int16x4_t __p0, int16x4_t 
__p1) { 8481 int16x8_t __ret; 8482 __ret = __builtin_shufflevector(__p0, __p1, 0, 1, 2, 3, 4, 5, 6, 7); 8483 return __ret; 8484 } 8485 #endif 8486 8487 #define vcreate_p8(__p0) __extension__ ({ \ 8488 poly8x8_t __ret; \ 8489 uint64_t __promote = __p0; \ 8490 __ret = (poly8x8_t)(__promote); \ 8491 __ret; \ 8492 }) 8493 #define vcreate_p16(__p0) __extension__ ({ \ 8494 poly16x4_t __ret; \ 8495 uint64_t __promote = __p0; \ 8496 __ret = (poly16x4_t)(__promote); \ 8497 __ret; \ 8498 }) 8499 #define vcreate_u8(__p0) __extension__ ({ \ 8500 uint8x8_t __ret; \ 8501 uint64_t __promote = __p0; \ 8502 __ret = (uint8x8_t)(__promote); \ 8503 __ret; \ 8504 }) 8505 #define vcreate_u32(__p0) __extension__ ({ \ 8506 uint32x2_t __ret; \ 8507 uint64_t __promote = __p0; \ 8508 __ret = (uint32x2_t)(__promote); \ 8509 __ret; \ 8510 }) 8511 #define vcreate_u64(__p0) __extension__ ({ \ 8512 uint64x1_t __ret; \ 8513 uint64_t __promote = __p0; \ 8514 __ret = (uint64x1_t)(__promote); \ 8515 __ret; \ 8516 }) 8517 #define vcreate_u16(__p0) __extension__ ({ \ 8518 uint16x4_t __ret; \ 8519 uint64_t __promote = __p0; \ 8520 __ret = (uint16x4_t)(__promote); \ 8521 __ret; \ 8522 }) 8523 #define vcreate_s8(__p0) __extension__ ({ \ 8524 int8x8_t __ret; \ 8525 uint64_t __promote = __p0; \ 8526 __ret = (int8x8_t)(__promote); \ 8527 __ret; \ 8528 }) 8529 #define vcreate_f32(__p0) __extension__ ({ \ 8530 float32x2_t __ret; \ 8531 uint64_t __promote = __p0; \ 8532 __ret = (float32x2_t)(__promote); \ 8533 __ret; \ 8534 }) 8535 #define vcreate_f16(__p0) __extension__ ({ \ 8536 float16x4_t __ret; \ 8537 uint64_t __promote = __p0; \ 8538 __ret = (float16x4_t)(__promote); \ 8539 __ret; \ 8540 }) 8541 #define vcreate_s32(__p0) __extension__ ({ \ 8542 int32x2_t __ret; \ 8543 uint64_t __promote = __p0; \ 8544 __ret = (int32x2_t)(__promote); \ 8545 __ret; \ 8546 }) 8547 #define vcreate_s64(__p0) __extension__ ({ \ 8548 int64x1_t __ret; \ 8549 uint64_t __promote = __p0; \ 8550 __ret = (int64x1_t)(__promote); \ 8551 
__ret; \ 8552 }) 8553 #define vcreate_s16(__p0) __extension__ ({ \ 8554 int16x4_t __ret; \ 8555 uint64_t __promote = __p0; \ 8556 __ret = (int16x4_t)(__promote); \ 8557 __ret; \ 8558 }) 8559 #ifdef __LITTLE_ENDIAN__ 8560 __ai __attribute__((target("neon"))) float32x4_t vcvtq_f32_u32(uint32x4_t __p0) { 8561 float32x4_t __ret; 8562 __ret = (float32x4_t) __builtin_neon_vcvtq_f32_v((int8x16_t)__p0, 50); 8563 return __ret; 8564 } 8565 #else 8566 __ai __attribute__((target("neon"))) float32x4_t vcvtq_f32_u32(uint32x4_t __p0) { 8567 float32x4_t __ret; 8568 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8569 __ret = (float32x4_t) __builtin_neon_vcvtq_f32_v((int8x16_t)__rev0, 50); 8570 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8571 return __ret; 8572 } 8573 #endif 8574 8575 #ifdef __LITTLE_ENDIAN__ 8576 __ai __attribute__((target("neon"))) float32x4_t vcvtq_f32_s32(int32x4_t __p0) { 8577 float32x4_t __ret; 8578 __ret = (float32x4_t) __builtin_neon_vcvtq_f32_v((int8x16_t)__p0, 34); 8579 return __ret; 8580 } 8581 #else 8582 __ai __attribute__((target("neon"))) float32x4_t vcvtq_f32_s32(int32x4_t __p0) { 8583 float32x4_t __ret; 8584 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8585 __ret = (float32x4_t) __builtin_neon_vcvtq_f32_v((int8x16_t)__rev0, 34); 8586 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8587 return __ret; 8588 } 8589 #endif 8590 8591 #ifdef __LITTLE_ENDIAN__ 8592 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_u32(uint32x2_t __p0) { 8593 float32x2_t __ret; 8594 __ret = (float32x2_t) __builtin_neon_vcvt_f32_v((int8x8_t)__p0, 18); 8595 return __ret; 8596 } 8597 #else 8598 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_u32(uint32x2_t __p0) { 8599 float32x2_t __ret; 8600 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8601 __ret = (float32x2_t) __builtin_neon_vcvt_f32_v((int8x8_t)__rev0, 18); 8602 __ret = 
__builtin_shufflevector(__ret, __ret, 1, 0); 8603 return __ret; 8604 } 8605 #endif 8606 8607 #ifdef __LITTLE_ENDIAN__ 8608 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_s32(int32x2_t __p0) { 8609 float32x2_t __ret; 8610 __ret = (float32x2_t) __builtin_neon_vcvt_f32_v((int8x8_t)__p0, 2); 8611 return __ret; 8612 } 8613 #else 8614 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_s32(int32x2_t __p0) { 8615 float32x2_t __ret; 8616 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8617 __ret = (float32x2_t) __builtin_neon_vcvt_f32_v((int8x8_t)__rev0, 2); 8618 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 8619 return __ret; 8620 } 8621 #endif 8622 8623 #ifdef __LITTLE_ENDIAN__ 8624 #define vcvtq_n_f32_u32(__p0, __p1) __extension__ ({ \ 8625 float32x4_t __ret; \ 8626 uint32x4_t __s0 = __p0; \ 8627 __ret = (float32x4_t) __builtin_neon_vcvtq_n_f32_v((int8x16_t)__s0, __p1, 50); \ 8628 __ret; \ 8629 }) 8630 #else 8631 #define vcvtq_n_f32_u32(__p0, __p1) __extension__ ({ \ 8632 float32x4_t __ret; \ 8633 uint32x4_t __s0 = __p0; \ 8634 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 8635 __ret = (float32x4_t) __builtin_neon_vcvtq_n_f32_v((int8x16_t)__rev0, __p1, 50); \ 8636 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 8637 __ret; \ 8638 }) 8639 #endif 8640 8641 #ifdef __LITTLE_ENDIAN__ 8642 #define vcvtq_n_f32_s32(__p0, __p1) __extension__ ({ \ 8643 float32x4_t __ret; \ 8644 int32x4_t __s0 = __p0; \ 8645 __ret = (float32x4_t) __builtin_neon_vcvtq_n_f32_v((int8x16_t)__s0, __p1, 34); \ 8646 __ret; \ 8647 }) 8648 #else 8649 #define vcvtq_n_f32_s32(__p0, __p1) __extension__ ({ \ 8650 float32x4_t __ret; \ 8651 int32x4_t __s0 = __p0; \ 8652 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 8653 __ret = (float32x4_t) __builtin_neon_vcvtq_n_f32_v((int8x16_t)__rev0, __p1, 34); \ 8654 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 8655 __ret; \ 8656 }) 
/*
 * float32 <-> 32-bit integer NEON conversion intrinsics.
 *
 * Layout of this span
 *   - The text below is a flattened listing: the bare 4-digit numbers between
 *     tokens appear to be the listing's own line numbers, not C tokens.
 *   - It opens with the #endif that closes the conditional of the definition
 *     preceding it, and closes with "#ifdef __LITTLE_ENDIAN__ <definition>
 *     #else"; the matching #else body and #endif lie after this span.
 *
 * Definitions (each one appears twice: once under #ifdef __LITTLE_ENDIAN__,
 * once under #else)
 *
 *   Statement-expression macros, (__p0 = vector operand, __p1 = second operand):
 *     name              __s0 type     result type   builtin                        code
 *     vcvt_n_f32_u32    uint32x2_t    float32x2_t   __builtin_neon_vcvt_n_f32_v    18
 *     vcvt_n_f32_s32    int32x2_t     float32x2_t   __builtin_neon_vcvt_n_f32_v     2
 *     vcvtq_n_s32_f32   float32x4_t   int32x4_t     __builtin_neon_vcvtq_n_s32_v   34
 *     vcvt_n_s32_f32    float32x2_t   int32x2_t     __builtin_neon_vcvt_n_s32_v     2
 *     vcvtq_n_u32_f32   float32x4_t   uint32x4_t    __builtin_neon_vcvtq_n_u32_v   50
 *     vcvt_n_u32_f32    float32x2_t   uint32x2_t    __builtin_neon_vcvt_n_u32_v    18
 *
 *   __ai functions, (__p0 = vector operand):
 *     name              __p0 type     return type   builtin                        code
 *     vcvtq_s32_f32     float32x4_t   int32x4_t     __builtin_neon_vcvtq_s32_v     34
 *     vcvt_s32_f32      float32x2_t   int32x2_t     __builtin_neon_vcvt_s32_v       2
 *     vcvtq_u32_f32     float32x4_t   uint32x4_t    __builtin_neon_vcvtq_u32_v     50
 *     vcvt_u32_f32      float32x2_t   uint32x2_t    __builtin_neon_vcvt_u32_v      18
 *       (only the __LITTLE_ENDIAN__ definition of vcvt_u32_f32 is inside this span)
 *
 * Shape shared by every definition
 *   - __LITTLE_ENDIAN__ branch: cast the operand to int8x8_t (2-lane forms) or
 *     int8x16_t (4-lane "q" forms), call the builtin, cast the result to the
 *     declared result type.
 *   - #else branch: identical call, but the operand's lanes are first reversed
 *     into __rev0 with __builtin_shufflevector (indices 1,0 or 3,2,1,0) and the
 *     result's lanes are reversed back the same way before it is produced.
 *   - In the macros, __p0 is copied once into __s0 and never mentioned again,
 *     so the argument expression is evaluated a single time. __p1 is forwarded
 *     unchanged to the builtin.
 *   - The macro locals (__ret, __s0, __rev0) are declared inside the
 *     statement expression in a fixed order; keep both the names and the order
 *     when editing, because the argument text is substituted into that scope.
 *
 * NOTE(review): the trailing integer ("code" above) is 2 / 18 on the signed /
 *   unsigned 2-lane forms and 34 / 50 on the signed / unsigned 4-lane forms in
 *   this span; presumably a type selector consumed by the builtin - confirm
 *   against the generator before changing any value.
 * NOTE(review): going by the _n_ naming these look like fixed-point
 *   conversions with __p1 as the fractional-bit count, and are presumably
 *   macros because the builtin needs __p1 as a constant - confirm against the
 *   Arm intrinsics reference.
 */
8657 #endif 8658 8659 #ifdef __LITTLE_ENDIAN__ 8660 #define vcvt_n_f32_u32(__p0, __p1) __extension__ ({ \ 8661 float32x2_t __ret; \ 8662 uint32x2_t __s0 = __p0; \ 8663 __ret = (float32x2_t) __builtin_neon_vcvt_n_f32_v((int8x8_t)__s0, __p1, 18); \ 8664 __ret; \ 8665 }) 8666 #else 8667 #define vcvt_n_f32_u32(__p0, __p1) __extension__ ({ \ 8668 float32x2_t __ret; \ 8669 uint32x2_t __s0 = __p0; \ 8670 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 8671 __ret = (float32x2_t) __builtin_neon_vcvt_n_f32_v((int8x8_t)__rev0, __p1, 18); \ 8672 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 8673 __ret; \ 8674 }) 8675 #endif 8676 8677 #ifdef __LITTLE_ENDIAN__ 8678 #define vcvt_n_f32_s32(__p0, __p1) __extension__ ({ \ 8679 float32x2_t __ret; \ 8680 int32x2_t __s0 = __p0; \ 8681 __ret = (float32x2_t) __builtin_neon_vcvt_n_f32_v((int8x8_t)__s0, __p1, 2); \ 8682 __ret; \ 8683 }) 8684 #else 8685 #define vcvt_n_f32_s32(__p0, __p1) __extension__ ({ \ 8686 float32x2_t __ret; \ 8687 int32x2_t __s0 = __p0; \ 8688 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 8689 __ret = (float32x2_t) __builtin_neon_vcvt_n_f32_v((int8x8_t)__rev0, __p1, 2); \ 8690 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 8691 __ret; \ 8692 }) 8693 #endif 8694 8695 #ifdef __LITTLE_ENDIAN__ 8696 #define vcvtq_n_s32_f32(__p0, __p1) __extension__ ({ \ 8697 int32x4_t __ret; \ 8698 float32x4_t __s0 = __p0; \ 8699 __ret = (int32x4_t) __builtin_neon_vcvtq_n_s32_v((int8x16_t)__s0, __p1, 34); \ 8700 __ret; \ 8701 }) 8702 #else 8703 #define vcvtq_n_s32_f32(__p0, __p1) __extension__ ({ \ 8704 int32x4_t __ret; \ 8705 float32x4_t __s0 = __p0; \ 8706 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 8707 __ret = (int32x4_t) __builtin_neon_vcvtq_n_s32_v((int8x16_t)__rev0, __p1, 34); \ 8708 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 8709 __ret; \ 8710 }) 8711 #endif 8712 8713 #ifdef __LITTLE_ENDIAN__ 8714 #define 
vcvt_n_s32_f32(__p0, __p1) __extension__ ({ \ 8715 int32x2_t __ret; \ 8716 float32x2_t __s0 = __p0; \ 8717 __ret = (int32x2_t) __builtin_neon_vcvt_n_s32_v((int8x8_t)__s0, __p1, 2); \ 8718 __ret; \ 8719 }) 8720 #else 8721 #define vcvt_n_s32_f32(__p0, __p1) __extension__ ({ \ 8722 int32x2_t __ret; \ 8723 float32x2_t __s0 = __p0; \ 8724 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 8725 __ret = (int32x2_t) __builtin_neon_vcvt_n_s32_v((int8x8_t)__rev0, __p1, 2); \ 8726 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 8727 __ret; \ 8728 }) 8729 #endif 8730 8731 #ifdef __LITTLE_ENDIAN__ 8732 #define vcvtq_n_u32_f32(__p0, __p1) __extension__ ({ \ 8733 uint32x4_t __ret; \ 8734 float32x4_t __s0 = __p0; \ 8735 __ret = (uint32x4_t) __builtin_neon_vcvtq_n_u32_v((int8x16_t)__s0, __p1, 50); \ 8736 __ret; \ 8737 }) 8738 #else 8739 #define vcvtq_n_u32_f32(__p0, __p1) __extension__ ({ \ 8740 uint32x4_t __ret; \ 8741 float32x4_t __s0 = __p0; \ 8742 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 8743 __ret = (uint32x4_t) __builtin_neon_vcvtq_n_u32_v((int8x16_t)__rev0, __p1, 50); \ 8744 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 8745 __ret; \ 8746 }) 8747 #endif 8748 8749 #ifdef __LITTLE_ENDIAN__ 8750 #define vcvt_n_u32_f32(__p0, __p1) __extension__ ({ \ 8751 uint32x2_t __ret; \ 8752 float32x2_t __s0 = __p0; \ 8753 __ret = (uint32x2_t) __builtin_neon_vcvt_n_u32_v((int8x8_t)__s0, __p1, 18); \ 8754 __ret; \ 8755 }) 8756 #else 8757 #define vcvt_n_u32_f32(__p0, __p1) __extension__ ({ \ 8758 uint32x2_t __ret; \ 8759 float32x2_t __s0 = __p0; \ 8760 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 8761 __ret = (uint32x2_t) __builtin_neon_vcvt_n_u32_v((int8x8_t)__rev0, __p1, 18); \ 8762 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 8763 __ret; \ 8764 }) 8765 #endif 8766 8767 #ifdef __LITTLE_ENDIAN__ 8768 __ai __attribute__((target("neon"))) int32x4_t vcvtq_s32_f32(float32x4_t 
__p0) { 8769 int32x4_t __ret; 8770 __ret = (int32x4_t) __builtin_neon_vcvtq_s32_v((int8x16_t)__p0, 34); 8771 return __ret; 8772 } 8773 #else 8774 __ai __attribute__((target("neon"))) int32x4_t vcvtq_s32_f32(float32x4_t __p0) { 8775 int32x4_t __ret; 8776 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8777 __ret = (int32x4_t) __builtin_neon_vcvtq_s32_v((int8x16_t)__rev0, 34); 8778 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8779 return __ret; 8780 } 8781 #endif 8782 8783 #ifdef __LITTLE_ENDIAN__ 8784 __ai __attribute__((target("neon"))) int32x2_t vcvt_s32_f32(float32x2_t __p0) { 8785 int32x2_t __ret; 8786 __ret = (int32x2_t) __builtin_neon_vcvt_s32_v((int8x8_t)__p0, 2); 8787 return __ret; 8788 } 8789 #else 8790 __ai __attribute__((target("neon"))) int32x2_t vcvt_s32_f32(float32x2_t __p0) { 8791 int32x2_t __ret; 8792 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8793 __ret = (int32x2_t) __builtin_neon_vcvt_s32_v((int8x8_t)__rev0, 2); 8794 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 8795 return __ret; 8796 } 8797 #endif 8798 8799 #ifdef __LITTLE_ENDIAN__ 8800 __ai __attribute__((target("neon"))) uint32x4_t vcvtq_u32_f32(float32x4_t __p0) { 8801 uint32x4_t __ret; 8802 __ret = (uint32x4_t) __builtin_neon_vcvtq_u32_v((int8x16_t)__p0, 50); 8803 return __ret; 8804 } 8805 #else 8806 __ai __attribute__((target("neon"))) uint32x4_t vcvtq_u32_f32(float32x4_t __p0) { 8807 uint32x4_t __ret; 8808 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 8809 __ret = (uint32x4_t) __builtin_neon_vcvtq_u32_v((int8x16_t)__rev0, 50); 8810 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 8811 return __ret; 8812 } 8813 #endif 8814 8815 #ifdef __LITTLE_ENDIAN__ 8816 __ai __attribute__((target("neon"))) uint32x2_t vcvt_u32_f32(float32x2_t __p0) { 8817 uint32x2_t __ret; 8818 __ret = (uint32x2_t) __builtin_neon_vcvt_u32_v((int8x8_t)__p0, 18); 8819 return __ret; 8820 } 8821 #else 
8822 __ai __attribute__((target("neon"))) uint32x2_t vcvt_u32_f32(float32x2_t __p0) { 8823 uint32x2_t __ret; 8824 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 8825 __ret = (uint32x2_t) __builtin_neon_vcvt_u32_v((int8x8_t)__rev0, 18); 8826 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 8827 return __ret; 8828 } 8829 #endif 8830 8831 #ifdef __LITTLE_ENDIAN__ 8832 #define vdup_lane_p8(__p0_8, __p1_8) __extension__ ({ \ 8833 poly8x8_t __ret_8; \ 8834 poly8x8_t __s0_8 = __p0_8; \ 8835 __ret_8 = splat_lane_p8(__s0_8, __p1_8); \ 8836 __ret_8; \ 8837 }) 8838 #else 8839 #define vdup_lane_p8(__p0_9, __p1_9) __extension__ ({ \ 8840 poly8x8_t __ret_9; \ 8841 poly8x8_t __s0_9 = __p0_9; \ 8842 poly8x8_t __rev0_9; __rev0_9 = __builtin_shufflevector(__s0_9, __s0_9, 7, 6, 5, 4, 3, 2, 1, 0); \ 8843 __ret_9 = __noswap_splat_lane_p8(__rev0_9, __p1_9); \ 8844 __ret_9 = __builtin_shufflevector(__ret_9, __ret_9, 7, 6, 5, 4, 3, 2, 1, 0); \ 8845 __ret_9; \ 8846 }) 8847 #endif 8848 8849 #ifdef __LITTLE_ENDIAN__ 8850 #define vdup_lane_p16(__p0_10, __p1_10) __extension__ ({ \ 8851 poly16x4_t __ret_10; \ 8852 poly16x4_t __s0_10 = __p0_10; \ 8853 __ret_10 = splat_lane_p16(__s0_10, __p1_10); \ 8854 __ret_10; \ 8855 }) 8856 #else 8857 #define vdup_lane_p16(__p0_11, __p1_11) __extension__ ({ \ 8858 poly16x4_t __ret_11; \ 8859 poly16x4_t __s0_11 = __p0_11; \ 8860 poly16x4_t __rev0_11; __rev0_11 = __builtin_shufflevector(__s0_11, __s0_11, 3, 2, 1, 0); \ 8861 __ret_11 = __noswap_splat_lane_p16(__rev0_11, __p1_11); \ 8862 __ret_11 = __builtin_shufflevector(__ret_11, __ret_11, 3, 2, 1, 0); \ 8863 __ret_11; \ 8864 }) 8865 #endif 8866 8867 #ifdef __LITTLE_ENDIAN__ 8868 #define vdupq_lane_p8(__p0_12, __p1_12) __extension__ ({ \ 8869 poly8x16_t __ret_12; \ 8870 poly8x8_t __s0_12 = __p0_12; \ 8871 __ret_12 = splatq_lane_p8(__s0_12, __p1_12); \ 8872 __ret_12; \ 8873 }) 8874 #else 8875 #define vdupq_lane_p8(__p0_13, __p1_13) __extension__ ({ \ 8876 poly8x16_t __ret_13; \ 8877 
poly8x8_t __s0_13 = __p0_13; \ 8878 poly8x8_t __rev0_13; __rev0_13 = __builtin_shufflevector(__s0_13, __s0_13, 7, 6, 5, 4, 3, 2, 1, 0); \ 8879 __ret_13 = __noswap_splatq_lane_p8(__rev0_13, __p1_13); \ 8880 __ret_13 = __builtin_shufflevector(__ret_13, __ret_13, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 8881 __ret_13; \ 8882 }) 8883 #endif 8884 8885 #ifdef __LITTLE_ENDIAN__ 8886 #define vdupq_lane_p16(__p0_14, __p1_14) __extension__ ({ \ 8887 poly16x8_t __ret_14; \ 8888 poly16x4_t __s0_14 = __p0_14; \ 8889 __ret_14 = splatq_lane_p16(__s0_14, __p1_14); \ 8890 __ret_14; \ 8891 }) 8892 #else 8893 #define vdupq_lane_p16(__p0_15, __p1_15) __extension__ ({ \ 8894 poly16x8_t __ret_15; \ 8895 poly16x4_t __s0_15 = __p0_15; \ 8896 poly16x4_t __rev0_15; __rev0_15 = __builtin_shufflevector(__s0_15, __s0_15, 3, 2, 1, 0); \ 8897 __ret_15 = __noswap_splatq_lane_p16(__rev0_15, __p1_15); \ 8898 __ret_15 = __builtin_shufflevector(__ret_15, __ret_15, 7, 6, 5, 4, 3, 2, 1, 0); \ 8899 __ret_15; \ 8900 }) 8901 #endif 8902 8903 #ifdef __LITTLE_ENDIAN__ 8904 #define vdupq_lane_u8(__p0_16, __p1_16) __extension__ ({ \ 8905 uint8x16_t __ret_16; \ 8906 uint8x8_t __s0_16 = __p0_16; \ 8907 __ret_16 = splatq_lane_u8(__s0_16, __p1_16); \ 8908 __ret_16; \ 8909 }) 8910 #else 8911 #define vdupq_lane_u8(__p0_17, __p1_17) __extension__ ({ \ 8912 uint8x16_t __ret_17; \ 8913 uint8x8_t __s0_17 = __p0_17; \ 8914 uint8x8_t __rev0_17; __rev0_17 = __builtin_shufflevector(__s0_17, __s0_17, 7, 6, 5, 4, 3, 2, 1, 0); \ 8915 __ret_17 = __noswap_splatq_lane_u8(__rev0_17, __p1_17); \ 8916 __ret_17 = __builtin_shufflevector(__ret_17, __ret_17, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 8917 __ret_17; \ 8918 }) 8919 #endif 8920 8921 #ifdef __LITTLE_ENDIAN__ 8922 #define vdupq_lane_u32(__p0_18, __p1_18) __extension__ ({ \ 8923 uint32x4_t __ret_18; \ 8924 uint32x2_t __s0_18 = __p0_18; \ 8925 __ret_18 = splatq_lane_u32(__s0_18, __p1_18); \ 8926 __ret_18; \ 8927 }) 8928 #else 8929 #define 
vdupq_lane_u32(__p0_19, __p1_19) __extension__ ({ \ 8930 uint32x4_t __ret_19; \ 8931 uint32x2_t __s0_19 = __p0_19; \ 8932 uint32x2_t __rev0_19; __rev0_19 = __builtin_shufflevector(__s0_19, __s0_19, 1, 0); \ 8933 __ret_19 = __noswap_splatq_lane_u32(__rev0_19, __p1_19); \ 8934 __ret_19 = __builtin_shufflevector(__ret_19, __ret_19, 3, 2, 1, 0); \ 8935 __ret_19; \ 8936 }) 8937 #endif 8938 8939 #ifdef __LITTLE_ENDIAN__ 8940 #define vdupq_lane_u64(__p0_20, __p1_20) __extension__ ({ \ 8941 uint64x2_t __ret_20; \ 8942 uint64x1_t __s0_20 = __p0_20; \ 8943 __ret_20 = splatq_lane_u64(__s0_20, __p1_20); \ 8944 __ret_20; \ 8945 }) 8946 #else 8947 #define vdupq_lane_u64(__p0_21, __p1_21) __extension__ ({ \ 8948 uint64x2_t __ret_21; \ 8949 uint64x1_t __s0_21 = __p0_21; \ 8950 __ret_21 = __noswap_splatq_lane_u64(__s0_21, __p1_21); \ 8951 __ret_21 = __builtin_shufflevector(__ret_21, __ret_21, 1, 0); \ 8952 __ret_21; \ 8953 }) 8954 #endif 8955 8956 #ifdef __LITTLE_ENDIAN__ 8957 #define vdupq_lane_u16(__p0_22, __p1_22) __extension__ ({ \ 8958 uint16x8_t __ret_22; \ 8959 uint16x4_t __s0_22 = __p0_22; \ 8960 __ret_22 = splatq_lane_u16(__s0_22, __p1_22); \ 8961 __ret_22; \ 8962 }) 8963 #else 8964 #define vdupq_lane_u16(__p0_23, __p1_23) __extension__ ({ \ 8965 uint16x8_t __ret_23; \ 8966 uint16x4_t __s0_23 = __p0_23; \ 8967 uint16x4_t __rev0_23; __rev0_23 = __builtin_shufflevector(__s0_23, __s0_23, 3, 2, 1, 0); \ 8968 __ret_23 = __noswap_splatq_lane_u16(__rev0_23, __p1_23); \ 8969 __ret_23 = __builtin_shufflevector(__ret_23, __ret_23, 7, 6, 5, 4, 3, 2, 1, 0); \ 8970 __ret_23; \ 8971 }) 8972 #endif 8973 8974 #ifdef __LITTLE_ENDIAN__ 8975 #define vdupq_lane_s8(__p0_24, __p1_24) __extension__ ({ \ 8976 int8x16_t __ret_24; \ 8977 int8x8_t __s0_24 = __p0_24; \ 8978 __ret_24 = splatq_lane_s8(__s0_24, __p1_24); \ 8979 __ret_24; \ 8980 }) 8981 #else 8982 #define vdupq_lane_s8(__p0_25, __p1_25) __extension__ ({ \ 8983 int8x16_t __ret_25; \ 8984 int8x8_t __s0_25 = __p0_25; \ 8985 int8x8_t 
__rev0_25; __rev0_25 = __builtin_shufflevector(__s0_25, __s0_25, 7, 6, 5, 4, 3, 2, 1, 0); \ 8986 __ret_25 = __noswap_splatq_lane_s8(__rev0_25, __p1_25); \ 8987 __ret_25 = __builtin_shufflevector(__ret_25, __ret_25, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 8988 __ret_25; \ 8989 }) 8990 #endif 8991 8992 #ifdef __LITTLE_ENDIAN__ 8993 #define vdupq_lane_f32(__p0_26, __p1_26) __extension__ ({ \ 8994 float32x4_t __ret_26; \ 8995 float32x2_t __s0_26 = __p0_26; \ 8996 __ret_26 = splatq_lane_f32(__s0_26, __p1_26); \ 8997 __ret_26; \ 8998 }) 8999 #else 9000 #define vdupq_lane_f32(__p0_27, __p1_27) __extension__ ({ \ 9001 float32x4_t __ret_27; \ 9002 float32x2_t __s0_27 = __p0_27; \ 9003 float32x2_t __rev0_27; __rev0_27 = __builtin_shufflevector(__s0_27, __s0_27, 1, 0); \ 9004 __ret_27 = __noswap_splatq_lane_f32(__rev0_27, __p1_27); \ 9005 __ret_27 = __builtin_shufflevector(__ret_27, __ret_27, 3, 2, 1, 0); \ 9006 __ret_27; \ 9007 }) 9008 #endif 9009 9010 #ifdef __LITTLE_ENDIAN__ 9011 #define vdupq_lane_f16(__p0_28, __p1_28) __extension__ ({ \ 9012 float16x8_t __ret_28; \ 9013 float16x4_t __s0_28 = __p0_28; \ 9014 __ret_28 = splatq_lane_f16(__s0_28, __p1_28); \ 9015 __ret_28; \ 9016 }) 9017 #else 9018 #define vdupq_lane_f16(__p0_29, __p1_29) __extension__ ({ \ 9019 float16x8_t __ret_29; \ 9020 float16x4_t __s0_29 = __p0_29; \ 9021 float16x4_t __rev0_29; __rev0_29 = __builtin_shufflevector(__s0_29, __s0_29, 3, 2, 1, 0); \ 9022 __ret_29 = __noswap_splatq_lane_f16(__rev0_29, __p1_29); \ 9023 __ret_29 = __builtin_shufflevector(__ret_29, __ret_29, 7, 6, 5, 4, 3, 2, 1, 0); \ 9024 __ret_29; \ 9025 }) 9026 #endif 9027 9028 #ifdef __LITTLE_ENDIAN__ 9029 #define vdupq_lane_s32(__p0_30, __p1_30) __extension__ ({ \ 9030 int32x4_t __ret_30; \ 9031 int32x2_t __s0_30 = __p0_30; \ 9032 __ret_30 = splatq_lane_s32(__s0_30, __p1_30); \ 9033 __ret_30; \ 9034 }) 9035 #else 9036 #define vdupq_lane_s32(__p0_31, __p1_31) __extension__ ({ \ 9037 int32x4_t __ret_31; \ 9038 int32x2_t 
__s0_31 = __p0_31; \ 9039 int32x2_t __rev0_31; __rev0_31 = __builtin_shufflevector(__s0_31, __s0_31, 1, 0); \ 9040 __ret_31 = __noswap_splatq_lane_s32(__rev0_31, __p1_31); \ 9041 __ret_31 = __builtin_shufflevector(__ret_31, __ret_31, 3, 2, 1, 0); \ 9042 __ret_31; \ 9043 }) 9044 #endif 9045 9046 #ifdef __LITTLE_ENDIAN__ 9047 #define vdupq_lane_s64(__p0_32, __p1_32) __extension__ ({ \ 9048 int64x2_t __ret_32; \ 9049 int64x1_t __s0_32 = __p0_32; \ 9050 __ret_32 = splatq_lane_s64(__s0_32, __p1_32); \ 9051 __ret_32; \ 9052 }) 9053 #else 9054 #define vdupq_lane_s64(__p0_33, __p1_33) __extension__ ({ \ 9055 int64x2_t __ret_33; \ 9056 int64x1_t __s0_33 = __p0_33; \ 9057 __ret_33 = __noswap_splatq_lane_s64(__s0_33, __p1_33); \ 9058 __ret_33 = __builtin_shufflevector(__ret_33, __ret_33, 1, 0); \ 9059 __ret_33; \ 9060 }) 9061 #endif 9062 9063 #ifdef __LITTLE_ENDIAN__ 9064 #define vdupq_lane_s16(__p0_34, __p1_34) __extension__ ({ \ 9065 int16x8_t __ret_34; \ 9066 int16x4_t __s0_34 = __p0_34; \ 9067 __ret_34 = splatq_lane_s16(__s0_34, __p1_34); \ 9068 __ret_34; \ 9069 }) 9070 #else 9071 #define vdupq_lane_s16(__p0_35, __p1_35) __extension__ ({ \ 9072 int16x8_t __ret_35; \ 9073 int16x4_t __s0_35 = __p0_35; \ 9074 int16x4_t __rev0_35; __rev0_35 = __builtin_shufflevector(__s0_35, __s0_35, 3, 2, 1, 0); \ 9075 __ret_35 = __noswap_splatq_lane_s16(__rev0_35, __p1_35); \ 9076 __ret_35 = __builtin_shufflevector(__ret_35, __ret_35, 7, 6, 5, 4, 3, 2, 1, 0); \ 9077 __ret_35; \ 9078 }) 9079 #endif 9080 9081 #ifdef __LITTLE_ENDIAN__ 9082 #define vdup_lane_u8(__p0_36, __p1_36) __extension__ ({ \ 9083 uint8x8_t __ret_36; \ 9084 uint8x8_t __s0_36 = __p0_36; \ 9085 __ret_36 = splat_lane_u8(__s0_36, __p1_36); \ 9086 __ret_36; \ 9087 }) 9088 #else 9089 #define vdup_lane_u8(__p0_37, __p1_37) __extension__ ({ \ 9090 uint8x8_t __ret_37; \ 9091 uint8x8_t __s0_37 = __p0_37; \ 9092 uint8x8_t __rev0_37; __rev0_37 = __builtin_shufflevector(__s0_37, __s0_37, 7, 6, 5, 4, 3, 2, 1, 0); \ 9093 __ret_37 = 
__noswap_splat_lane_u8(__rev0_37, __p1_37); \ 9094 __ret_37 = __builtin_shufflevector(__ret_37, __ret_37, 7, 6, 5, 4, 3, 2, 1, 0); \ 9095 __ret_37; \ 9096 }) 9097 #endif 9098 9099 #ifdef __LITTLE_ENDIAN__ 9100 #define vdup_lane_u32(__p0_38, __p1_38) __extension__ ({ \ 9101 uint32x2_t __ret_38; \ 9102 uint32x2_t __s0_38 = __p0_38; \ 9103 __ret_38 = splat_lane_u32(__s0_38, __p1_38); \ 9104 __ret_38; \ 9105 }) 9106 #else 9107 #define vdup_lane_u32(__p0_39, __p1_39) __extension__ ({ \ 9108 uint32x2_t __ret_39; \ 9109 uint32x2_t __s0_39 = __p0_39; \ 9110 uint32x2_t __rev0_39; __rev0_39 = __builtin_shufflevector(__s0_39, __s0_39, 1, 0); \ 9111 __ret_39 = __noswap_splat_lane_u32(__rev0_39, __p1_39); \ 9112 __ret_39 = __builtin_shufflevector(__ret_39, __ret_39, 1, 0); \ 9113 __ret_39; \ 9114 }) 9115 #endif 9116 9117 #define vdup_lane_u64(__p0_40, __p1_40) __extension__ ({ \ 9118 uint64x1_t __ret_40; \ 9119 uint64x1_t __s0_40 = __p0_40; \ 9120 __ret_40 = splat_lane_u64(__s0_40, __p1_40); \ 9121 __ret_40; \ 9122 }) 9123 #ifdef __LITTLE_ENDIAN__ 9124 #define vdup_lane_u16(__p0_41, __p1_41) __extension__ ({ \ 9125 uint16x4_t __ret_41; \ 9126 uint16x4_t __s0_41 = __p0_41; \ 9127 __ret_41 = splat_lane_u16(__s0_41, __p1_41); \ 9128 __ret_41; \ 9129 }) 9130 #else 9131 #define vdup_lane_u16(__p0_42, __p1_42) __extension__ ({ \ 9132 uint16x4_t __ret_42; \ 9133 uint16x4_t __s0_42 = __p0_42; \ 9134 uint16x4_t __rev0_42; __rev0_42 = __builtin_shufflevector(__s0_42, __s0_42, 3, 2, 1, 0); \ 9135 __ret_42 = __noswap_splat_lane_u16(__rev0_42, __p1_42); \ 9136 __ret_42 = __builtin_shufflevector(__ret_42, __ret_42, 3, 2, 1, 0); \ 9137 __ret_42; \ 9138 }) 9139 #endif 9140 9141 #ifdef __LITTLE_ENDIAN__ 9142 #define vdup_lane_s8(__p0_43, __p1_43) __extension__ ({ \ 9143 int8x8_t __ret_43; \ 9144 int8x8_t __s0_43 = __p0_43; \ 9145 __ret_43 = splat_lane_s8(__s0_43, __p1_43); \ 9146 __ret_43; \ 9147 }) 9148 #else 9149 #define vdup_lane_s8(__p0_44, __p1_44) __extension__ ({ \ 9150 int8x8_t 
__ret_44; \ 9151 int8x8_t __s0_44 = __p0_44; \ 9152 int8x8_t __rev0_44; __rev0_44 = __builtin_shufflevector(__s0_44, __s0_44, 7, 6, 5, 4, 3, 2, 1, 0); \ 9153 __ret_44 = __noswap_splat_lane_s8(__rev0_44, __p1_44); \ 9154 __ret_44 = __builtin_shufflevector(__ret_44, __ret_44, 7, 6, 5, 4, 3, 2, 1, 0); \ 9155 __ret_44; \ 9156 }) 9157 #endif 9158 9159 #ifdef __LITTLE_ENDIAN__ 9160 #define vdup_lane_f32(__p0_45, __p1_45) __extension__ ({ \ 9161 float32x2_t __ret_45; \ 9162 float32x2_t __s0_45 = __p0_45; \ 9163 __ret_45 = splat_lane_f32(__s0_45, __p1_45); \ 9164 __ret_45; \ 9165 }) 9166 #else 9167 #define vdup_lane_f32(__p0_46, __p1_46) __extension__ ({ \ 9168 float32x2_t __ret_46; \ 9169 float32x2_t __s0_46 = __p0_46; \ 9170 float32x2_t __rev0_46; __rev0_46 = __builtin_shufflevector(__s0_46, __s0_46, 1, 0); \ 9171 __ret_46 = __noswap_splat_lane_f32(__rev0_46, __p1_46); \ 9172 __ret_46 = __builtin_shufflevector(__ret_46, __ret_46, 1, 0); \ 9173 __ret_46; \ 9174 }) 9175 #endif 9176 9177 #ifdef __LITTLE_ENDIAN__ 9178 #define vdup_lane_f16(__p0_47, __p1_47) __extension__ ({ \ 9179 float16x4_t __ret_47; \ 9180 float16x4_t __s0_47 = __p0_47; \ 9181 __ret_47 = splat_lane_f16(__s0_47, __p1_47); \ 9182 __ret_47; \ 9183 }) 9184 #else 9185 #define vdup_lane_f16(__p0_48, __p1_48) __extension__ ({ \ 9186 float16x4_t __ret_48; \ 9187 float16x4_t __s0_48 = __p0_48; \ 9188 float16x4_t __rev0_48; __rev0_48 = __builtin_shufflevector(__s0_48, __s0_48, 3, 2, 1, 0); \ 9189 __ret_48 = __noswap_splat_lane_f16(__rev0_48, __p1_48); \ 9190 __ret_48 = __builtin_shufflevector(__ret_48, __ret_48, 3, 2, 1, 0); \ 9191 __ret_48; \ 9192 }) 9193 #endif 9194 9195 #ifdef __LITTLE_ENDIAN__ 9196 #define vdup_lane_s32(__p0_49, __p1_49) __extension__ ({ \ 9197 int32x2_t __ret_49; \ 9198 int32x2_t __s0_49 = __p0_49; \ 9199 __ret_49 = splat_lane_s32(__s0_49, __p1_49); \ 9200 __ret_49; \ 9201 }) 9202 #else 9203 #define vdup_lane_s32(__p0_50, __p1_50) __extension__ ({ \ 9204 int32x2_t __ret_50; \ 9205 int32x2_t 
__s0_50 = __p0_50; \ 9206 int32x2_t __rev0_50; __rev0_50 = __builtin_shufflevector(__s0_50, __s0_50, 1, 0); \ 9207 __ret_50 = __noswap_splat_lane_s32(__rev0_50, __p1_50); \ 9208 __ret_50 = __builtin_shufflevector(__ret_50, __ret_50, 1, 0); \ 9209 __ret_50; \ 9210 }) 9211 #endif 9212 9213 #define vdup_lane_s64(__p0_51, __p1_51) __extension__ ({ \ 9214 int64x1_t __ret_51; \ 9215 int64x1_t __s0_51 = __p0_51; \ 9216 __ret_51 = splat_lane_s64(__s0_51, __p1_51); \ 9217 __ret_51; \ 9218 }) 9219 #ifdef __LITTLE_ENDIAN__ 9220 #define vdup_lane_s16(__p0_52, __p1_52) __extension__ ({ \ 9221 int16x4_t __ret_52; \ 9222 int16x4_t __s0_52 = __p0_52; \ 9223 __ret_52 = splat_lane_s16(__s0_52, __p1_52); \ 9224 __ret_52; \ 9225 }) 9226 #else 9227 #define vdup_lane_s16(__p0_53, __p1_53) __extension__ ({ \ 9228 int16x4_t __ret_53; \ 9229 int16x4_t __s0_53 = __p0_53; \ 9230 int16x4_t __rev0_53; __rev0_53 = __builtin_shufflevector(__s0_53, __s0_53, 3, 2, 1, 0); \ 9231 __ret_53 = __noswap_splat_lane_s16(__rev0_53, __p1_53); \ 9232 __ret_53 = __builtin_shufflevector(__ret_53, __ret_53, 3, 2, 1, 0); \ 9233 __ret_53; \ 9234 }) 9235 #endif 9236 9237 #ifdef __LITTLE_ENDIAN__ 9238 __ai __attribute__((target("neon"))) poly8x8_t vdup_n_p8(poly8_t __p0) { 9239 poly8x8_t __ret; 9240 __ret = (poly8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9241 return __ret; 9242 } 9243 #else 9244 __ai __attribute__((target("neon"))) poly8x8_t vdup_n_p8(poly8_t __p0) { 9245 poly8x8_t __ret; 9246 __ret = (poly8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9247 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9248 return __ret; 9249 } 9250 #endif 9251 9252 #ifdef __LITTLE_ENDIAN__ 9253 __ai __attribute__((target("neon"))) poly16x4_t vdup_n_p16(poly16_t __p0) { 9254 poly16x4_t __ret; 9255 __ret = (poly16x4_t) {__p0, __p0, __p0, __p0}; 9256 return __ret; 9257 } 9258 #else 9259 __ai __attribute__((target("neon"))) poly16x4_t vdup_n_p16(poly16_t __p0) { 9260 poly16x4_t __ret; 
9261 __ret = (poly16x4_t) {__p0, __p0, __p0, __p0}; 9262 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9263 return __ret; 9264 } 9265 #endif 9266 9267 #ifdef __LITTLE_ENDIAN__ 9268 __ai __attribute__((target("neon"))) poly8x16_t vdupq_n_p8(poly8_t __p0) { 9269 poly8x16_t __ret; 9270 __ret = (poly8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9271 return __ret; 9272 } 9273 #else 9274 __ai __attribute__((target("neon"))) poly8x16_t vdupq_n_p8(poly8_t __p0) { 9275 poly8x16_t __ret; 9276 __ret = (poly8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9277 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 9278 return __ret; 9279 } 9280 #endif 9281 9282 #ifdef __LITTLE_ENDIAN__ 9283 __ai __attribute__((target("neon"))) poly16x8_t vdupq_n_p16(poly16_t __p0) { 9284 poly16x8_t __ret; 9285 __ret = (poly16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9286 return __ret; 9287 } 9288 #else 9289 __ai __attribute__((target("neon"))) poly16x8_t vdupq_n_p16(poly16_t __p0) { 9290 poly16x8_t __ret; 9291 __ret = (poly16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9292 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9293 return __ret; 9294 } 9295 #endif 9296 9297 #ifdef __LITTLE_ENDIAN__ 9298 __ai __attribute__((target("neon"))) uint8x16_t vdupq_n_u8(uint8_t __p0) { 9299 uint8x16_t __ret; 9300 __ret = (uint8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9301 return __ret; 9302 } 9303 #else 9304 __ai __attribute__((target("neon"))) uint8x16_t vdupq_n_u8(uint8_t __p0) { 9305 uint8x16_t __ret; 9306 __ret = (uint8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9307 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 
0); 9308 return __ret; 9309 } 9310 #endif 9311 9312 #ifdef __LITTLE_ENDIAN__ 9313 __ai __attribute__((target("neon"))) uint32x4_t vdupq_n_u32(uint32_t __p0) { 9314 uint32x4_t __ret; 9315 __ret = (uint32x4_t) {__p0, __p0, __p0, __p0}; 9316 return __ret; 9317 } 9318 #else 9319 __ai __attribute__((target("neon"))) uint32x4_t vdupq_n_u32(uint32_t __p0) { 9320 uint32x4_t __ret; 9321 __ret = (uint32x4_t) {__p0, __p0, __p0, __p0}; 9322 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9323 return __ret; 9324 } 9325 #endif 9326 9327 #ifdef __LITTLE_ENDIAN__ 9328 __ai __attribute__((target("neon"))) uint64x2_t vdupq_n_u64(uint64_t __p0) { 9329 uint64x2_t __ret; 9330 __ret = (uint64x2_t) {__p0, __p0}; 9331 return __ret; 9332 } 9333 #else 9334 __ai __attribute__((target("neon"))) uint64x2_t vdupq_n_u64(uint64_t __p0) { 9335 uint64x2_t __ret; 9336 __ret = (uint64x2_t) {__p0, __p0}; 9337 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9338 return __ret; 9339 } 9340 #endif 9341 9342 #ifdef __LITTLE_ENDIAN__ 9343 __ai __attribute__((target("neon"))) uint16x8_t vdupq_n_u16(uint16_t __p0) { 9344 uint16x8_t __ret; 9345 __ret = (uint16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9346 return __ret; 9347 } 9348 #else 9349 __ai __attribute__((target("neon"))) uint16x8_t vdupq_n_u16(uint16_t __p0) { 9350 uint16x8_t __ret; 9351 __ret = (uint16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9352 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9353 return __ret; 9354 } 9355 #endif 9356 9357 #ifdef __LITTLE_ENDIAN__ 9358 __ai __attribute__((target("neon"))) int8x16_t vdupq_n_s8(int8_t __p0) { 9359 int8x16_t __ret; 9360 __ret = (int8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9361 return __ret; 9362 } 9363 #else 9364 __ai __attribute__((target("neon"))) int8x16_t vdupq_n_s8(int8_t __p0) { 9365 int8x16_t __ret; 9366 __ret = (int8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, 
__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9367 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 9368 return __ret; 9369 } 9370 #endif 9371 9372 #ifdef __LITTLE_ENDIAN__ 9373 __ai __attribute__((target("neon"))) float32x4_t vdupq_n_f32(float32_t __p0) { 9374 float32x4_t __ret; 9375 __ret = (float32x4_t) {__p0, __p0, __p0, __p0}; 9376 return __ret; 9377 } 9378 #else 9379 __ai __attribute__((target("neon"))) float32x4_t vdupq_n_f32(float32_t __p0) { 9380 float32x4_t __ret; 9381 __ret = (float32x4_t) {__p0, __p0, __p0, __p0}; 9382 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9383 return __ret; 9384 } 9385 #endif 9386 9387 #ifdef __LITTLE_ENDIAN__ 9388 #define vdupq_n_f16(__p0) __extension__ ({ \ 9389 float16x8_t __ret; \ 9390 float16_t __s0 = __p0; \ 9391 __ret = (float16x8_t) {__s0, __s0, __s0, __s0, __s0, __s0, __s0, __s0}; \ 9392 __ret; \ 9393 }) 9394 #else 9395 #define vdupq_n_f16(__p0) __extension__ ({ \ 9396 float16x8_t __ret; \ 9397 float16_t __s0 = __p0; \ 9398 __ret = (float16x8_t) {__s0, __s0, __s0, __s0, __s0, __s0, __s0, __s0}; \ 9399 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 9400 __ret; \ 9401 }) 9402 #endif 9403 9404 #ifdef __LITTLE_ENDIAN__ 9405 __ai __attribute__((target("neon"))) int32x4_t vdupq_n_s32(int32_t __p0) { 9406 int32x4_t __ret; 9407 __ret = (int32x4_t) {__p0, __p0, __p0, __p0}; 9408 return __ret; 9409 } 9410 #else 9411 __ai __attribute__((target("neon"))) int32x4_t vdupq_n_s32(int32_t __p0) { 9412 int32x4_t __ret; 9413 __ret = (int32x4_t) {__p0, __p0, __p0, __p0}; 9414 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9415 return __ret; 9416 } 9417 #endif 9418 9419 #ifdef __LITTLE_ENDIAN__ 9420 __ai __attribute__((target("neon"))) int64x2_t vdupq_n_s64(int64_t __p0) { 9421 int64x2_t __ret; 9422 __ret = (int64x2_t) {__p0, __p0}; 9423 return __ret; 9424 } 9425 #else 9426 __ai __attribute__((target("neon"))) int64x2_t 
vdupq_n_s64(int64_t __p0) { 9427 int64x2_t __ret; 9428 __ret = (int64x2_t) {__p0, __p0}; 9429 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9430 return __ret; 9431 } 9432 #endif 9433 9434 #ifdef __LITTLE_ENDIAN__ 9435 __ai __attribute__((target("neon"))) int16x8_t vdupq_n_s16(int16_t __p0) { 9436 int16x8_t __ret; 9437 __ret = (int16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9438 return __ret; 9439 } 9440 #else 9441 __ai __attribute__((target("neon"))) int16x8_t vdupq_n_s16(int16_t __p0) { 9442 int16x8_t __ret; 9443 __ret = (int16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9444 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9445 return __ret; 9446 } 9447 #endif 9448 9449 #ifdef __LITTLE_ENDIAN__ 9450 __ai __attribute__((target("neon"))) uint8x8_t vdup_n_u8(uint8_t __p0) { 9451 uint8x8_t __ret; 9452 __ret = (uint8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9453 return __ret; 9454 } 9455 #else 9456 __ai __attribute__((target("neon"))) uint8x8_t vdup_n_u8(uint8_t __p0) { 9457 uint8x8_t __ret; 9458 __ret = (uint8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9459 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9460 return __ret; 9461 } 9462 #endif 9463 9464 #ifdef __LITTLE_ENDIAN__ 9465 __ai __attribute__((target("neon"))) uint32x2_t vdup_n_u32(uint32_t __p0) { 9466 uint32x2_t __ret; 9467 __ret = (uint32x2_t) {__p0, __p0}; 9468 return __ret; 9469 } 9470 #else 9471 __ai __attribute__((target("neon"))) uint32x2_t vdup_n_u32(uint32_t __p0) { 9472 uint32x2_t __ret; 9473 __ret = (uint32x2_t) {__p0, __p0}; 9474 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9475 return __ret; 9476 } 9477 #endif 9478 9479 __ai __attribute__((target("neon"))) uint64x1_t vdup_n_u64(uint64_t __p0) { 9480 uint64x1_t __ret; 9481 __ret = (uint64x1_t) {__p0}; 9482 return __ret; 9483 } 9484 #ifdef __LITTLE_ENDIAN__ 9485 __ai __attribute__((target("neon"))) uint16x4_t vdup_n_u16(uint16_t __p0) { 
9486 uint16x4_t __ret; 9487 __ret = (uint16x4_t) {__p0, __p0, __p0, __p0}; 9488 return __ret; 9489 } 9490 #else 9491 __ai __attribute__((target("neon"))) uint16x4_t vdup_n_u16(uint16_t __p0) { 9492 uint16x4_t __ret; 9493 __ret = (uint16x4_t) {__p0, __p0, __p0, __p0}; 9494 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9495 return __ret; 9496 } 9497 #endif 9498 9499 #ifdef __LITTLE_ENDIAN__ 9500 __ai __attribute__((target("neon"))) int8x8_t vdup_n_s8(int8_t __p0) { 9501 int8x8_t __ret; 9502 __ret = (int8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9503 return __ret; 9504 } 9505 #else 9506 __ai __attribute__((target("neon"))) int8x8_t vdup_n_s8(int8_t __p0) { 9507 int8x8_t __ret; 9508 __ret = (int8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 9509 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9510 return __ret; 9511 } 9512 #endif 9513 9514 #ifdef __LITTLE_ENDIAN__ 9515 __ai __attribute__((target("neon"))) float32x2_t vdup_n_f32(float32_t __p0) { 9516 float32x2_t __ret; 9517 __ret = (float32x2_t) {__p0, __p0}; 9518 return __ret; 9519 } 9520 #else 9521 __ai __attribute__((target("neon"))) float32x2_t vdup_n_f32(float32_t __p0) { 9522 float32x2_t __ret; 9523 __ret = (float32x2_t) {__p0, __p0}; 9524 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9525 return __ret; 9526 } 9527 #endif 9528 9529 #ifdef __LITTLE_ENDIAN__ 9530 #define vdup_n_f16(__p0) __extension__ ({ \ 9531 float16x4_t __ret; \ 9532 float16_t __s0 = __p0; \ 9533 __ret = (float16x4_t) {__s0, __s0, __s0, __s0}; \ 9534 __ret; \ 9535 }) 9536 #else 9537 #define vdup_n_f16(__p0) __extension__ ({ \ 9538 float16x4_t __ret; \ 9539 float16_t __s0 = __p0; \ 9540 __ret = (float16x4_t) {__s0, __s0, __s0, __s0}; \ 9541 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 9542 __ret; \ 9543 }) 9544 #endif 9545 9546 #ifdef __LITTLE_ENDIAN__ 9547 __ai __attribute__((target("neon"))) int32x2_t vdup_n_s32(int32_t __p0) { 9548 int32x2_t __ret; 9549 __ret = 
(int32x2_t) {__p0, __p0}; 9550 return __ret; 9551 } 9552 #else 9553 __ai __attribute__((target("neon"))) int32x2_t vdup_n_s32(int32_t __p0) { 9554 int32x2_t __ret; 9555 __ret = (int32x2_t) {__p0, __p0}; 9556 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9557 return __ret; 9558 } 9559 #endif 9560 9561 __ai __attribute__((target("neon"))) int64x1_t vdup_n_s64(int64_t __p0) { 9562 int64x1_t __ret; 9563 __ret = (int64x1_t) {__p0}; 9564 return __ret; 9565 } 9566 #ifdef __LITTLE_ENDIAN__ 9567 __ai __attribute__((target("neon"))) int16x4_t vdup_n_s16(int16_t __p0) { 9568 int16x4_t __ret; 9569 __ret = (int16x4_t) {__p0, __p0, __p0, __p0}; 9570 return __ret; 9571 } 9572 #else 9573 __ai __attribute__((target("neon"))) int16x4_t vdup_n_s16(int16_t __p0) { 9574 int16x4_t __ret; 9575 __ret = (int16x4_t) {__p0, __p0, __p0, __p0}; 9576 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9577 return __ret; 9578 } 9579 #endif 9580 9581 #ifdef __LITTLE_ENDIAN__ 9582 __ai __attribute__((target("neon"))) uint8x16_t veorq_u8(uint8x16_t __p0, uint8x16_t __p1) { 9583 uint8x16_t __ret; 9584 __ret = __p0 ^ __p1; 9585 return __ret; 9586 } 9587 #else 9588 __ai __attribute__((target("neon"))) uint8x16_t veorq_u8(uint8x16_t __p0, uint8x16_t __p1) { 9589 uint8x16_t __ret; 9590 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 9591 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 9592 __ret = __rev0 ^ __rev1; 9593 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 9594 return __ret; 9595 } 9596 #endif 9597 9598 #ifdef __LITTLE_ENDIAN__ 9599 __ai __attribute__((target("neon"))) uint32x4_t veorq_u32(uint32x4_t __p0, uint32x4_t __p1) { 9600 uint32x4_t __ret; 9601 __ret = __p0 ^ __p1; 9602 return __ret; 9603 } 9604 #else 9605 __ai __attribute__((target("neon"))) uint32x4_t veorq_u32(uint32x4_t __p0, 
uint32x4_t __p1) { 9606 uint32x4_t __ret; 9607 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 9608 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 9609 __ret = __rev0 ^ __rev1; 9610 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9611 return __ret; 9612 } 9613 #endif 9614 9615 #ifdef __LITTLE_ENDIAN__ 9616 __ai __attribute__((target("neon"))) uint64x2_t veorq_u64(uint64x2_t __p0, uint64x2_t __p1) { 9617 uint64x2_t __ret; 9618 __ret = __p0 ^ __p1; 9619 return __ret; 9620 } 9621 #else 9622 __ai __attribute__((target("neon"))) uint64x2_t veorq_u64(uint64x2_t __p0, uint64x2_t __p1) { 9623 uint64x2_t __ret; 9624 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 9625 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 9626 __ret = __rev0 ^ __rev1; 9627 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9628 return __ret; 9629 } 9630 #endif 9631 9632 #ifdef __LITTLE_ENDIAN__ 9633 __ai __attribute__((target("neon"))) uint16x8_t veorq_u16(uint16x8_t __p0, uint16x8_t __p1) { 9634 uint16x8_t __ret; 9635 __ret = __p0 ^ __p1; 9636 return __ret; 9637 } 9638 #else 9639 __ai __attribute__((target("neon"))) uint16x8_t veorq_u16(uint16x8_t __p0, uint16x8_t __p1) { 9640 uint16x8_t __ret; 9641 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 9642 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 9643 __ret = __rev0 ^ __rev1; 9644 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9645 return __ret; 9646 } 9647 #endif 9648 9649 #ifdef __LITTLE_ENDIAN__ 9650 __ai __attribute__((target("neon"))) int8x16_t veorq_s8(int8x16_t __p0, int8x16_t __p1) { 9651 int8x16_t __ret; 9652 __ret = __p0 ^ __p1; 9653 return __ret; 9654 } 9655 #else 9656 __ai __attribute__((target("neon"))) int8x16_t veorq_s8(int8x16_t __p0, int8x16_t __p1) { 9657 int8x16_t __ret; 9658 int8x16_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 9659 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 9660 __ret = __rev0 ^ __rev1; 9661 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 9662 return __ret; 9663 } 9664 #endif 9665 9666 #ifdef __LITTLE_ENDIAN__ 9667 __ai __attribute__((target("neon"))) int32x4_t veorq_s32(int32x4_t __p0, int32x4_t __p1) { 9668 int32x4_t __ret; 9669 __ret = __p0 ^ __p1; 9670 return __ret; 9671 } 9672 #else 9673 __ai __attribute__((target("neon"))) int32x4_t veorq_s32(int32x4_t __p0, int32x4_t __p1) { 9674 int32x4_t __ret; 9675 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 9676 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 9677 __ret = __rev0 ^ __rev1; 9678 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9679 return __ret; 9680 } 9681 #endif 9682 9683 #ifdef __LITTLE_ENDIAN__ 9684 __ai __attribute__((target("neon"))) int64x2_t veorq_s64(int64x2_t __p0, int64x2_t __p1) { 9685 int64x2_t __ret; 9686 __ret = __p0 ^ __p1; 9687 return __ret; 9688 } 9689 #else 9690 __ai __attribute__((target("neon"))) int64x2_t veorq_s64(int64x2_t __p0, int64x2_t __p1) { 9691 int64x2_t __ret; 9692 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 9693 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 9694 __ret = __rev0 ^ __rev1; 9695 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9696 return __ret; 9697 } 9698 #endif 9699 9700 #ifdef __LITTLE_ENDIAN__ 9701 __ai __attribute__((target("neon"))) int16x8_t veorq_s16(int16x8_t __p0, int16x8_t __p1) { 9702 int16x8_t __ret; 9703 __ret = __p0 ^ __p1; 9704 return __ret; 9705 } 9706 #else 9707 __ai __attribute__((target("neon"))) int16x8_t veorq_s16(int16x8_t __p0, int16x8_t __p1) { 9708 int16x8_t __ret; 9709 int16x8_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 9710 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 9711 __ret = __rev0 ^ __rev1; 9712 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9713 return __ret; 9714 } 9715 #endif 9716 9717 #ifdef __LITTLE_ENDIAN__ 9718 __ai __attribute__((target("neon"))) uint8x8_t veor_u8(uint8x8_t __p0, uint8x8_t __p1) { 9719 uint8x8_t __ret; 9720 __ret = __p0 ^ __p1; 9721 return __ret; 9722 } 9723 #else 9724 __ai __attribute__((target("neon"))) uint8x8_t veor_u8(uint8x8_t __p0, uint8x8_t __p1) { 9725 uint8x8_t __ret; 9726 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 9727 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 9728 __ret = __rev0 ^ __rev1; 9729 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9730 return __ret; 9731 } 9732 #endif 9733 9734 #ifdef __LITTLE_ENDIAN__ 9735 __ai __attribute__((target("neon"))) uint32x2_t veor_u32(uint32x2_t __p0, uint32x2_t __p1) { 9736 uint32x2_t __ret; 9737 __ret = __p0 ^ __p1; 9738 return __ret; 9739 } 9740 #else 9741 __ai __attribute__((target("neon"))) uint32x2_t veor_u32(uint32x2_t __p0, uint32x2_t __p1) { 9742 uint32x2_t __ret; 9743 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 9744 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 9745 __ret = __rev0 ^ __rev1; 9746 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9747 return __ret; 9748 } 9749 #endif 9750 9751 __ai __attribute__((target("neon"))) uint64x1_t veor_u64(uint64x1_t __p0, uint64x1_t __p1) { 9752 uint64x1_t __ret; 9753 __ret = __p0 ^ __p1; 9754 return __ret; 9755 } 9756 #ifdef __LITTLE_ENDIAN__ 9757 __ai __attribute__((target("neon"))) uint16x4_t veor_u16(uint16x4_t __p0, uint16x4_t __p1) { 9758 uint16x4_t __ret; 9759 __ret = __p0 ^ __p1; 9760 return __ret; 9761 } 9762 #else 9763 __ai 
__attribute__((target("neon"))) uint16x4_t veor_u16(uint16x4_t __p0, uint16x4_t __p1) { 9764 uint16x4_t __ret; 9765 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 9766 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 9767 __ret = __rev0 ^ __rev1; 9768 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9769 return __ret; 9770 } 9771 #endif 9772 9773 #ifdef __LITTLE_ENDIAN__ 9774 __ai __attribute__((target("neon"))) int8x8_t veor_s8(int8x8_t __p0, int8x8_t __p1) { 9775 int8x8_t __ret; 9776 __ret = __p0 ^ __p1; 9777 return __ret; 9778 } 9779 #else 9780 __ai __attribute__((target("neon"))) int8x8_t veor_s8(int8x8_t __p0, int8x8_t __p1) { 9781 int8x8_t __ret; 9782 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 9783 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 9784 __ret = __rev0 ^ __rev1; 9785 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 9786 return __ret; 9787 } 9788 #endif 9789 9790 #ifdef __LITTLE_ENDIAN__ 9791 __ai __attribute__((target("neon"))) int32x2_t veor_s32(int32x2_t __p0, int32x2_t __p1) { 9792 int32x2_t __ret; 9793 __ret = __p0 ^ __p1; 9794 return __ret; 9795 } 9796 #else 9797 __ai __attribute__((target("neon"))) int32x2_t veor_s32(int32x2_t __p0, int32x2_t __p1) { 9798 int32x2_t __ret; 9799 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 9800 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 9801 __ret = __rev0 ^ __rev1; 9802 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 9803 return __ret; 9804 } 9805 #endif 9806 9807 __ai __attribute__((target("neon"))) int64x1_t veor_s64(int64x1_t __p0, int64x1_t __p1) { 9808 int64x1_t __ret; 9809 __ret = __p0 ^ __p1; 9810 return __ret; 9811 } 9812 #ifdef __LITTLE_ENDIAN__ 9813 __ai __attribute__((target("neon"))) int16x4_t veor_s16(int16x4_t __p0, int16x4_t __p1) { 9814 int16x4_t __ret; 9815 __ret = 
__p0 ^ __p1; 9816 return __ret; 9817 } 9818 #else 9819 __ai __attribute__((target("neon"))) int16x4_t veor_s16(int16x4_t __p0, int16x4_t __p1) { 9820 int16x4_t __ret; 9821 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 9822 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 9823 __ret = __rev0 ^ __rev1; 9824 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 9825 return __ret; 9826 } 9827 #endif 9828 9829 #ifdef __LITTLE_ENDIAN__ 9830 #define vext_p8(__p0, __p1, __p2) __extension__ ({ \ 9831 poly8x8_t __ret; \ 9832 poly8x8_t __s0 = __p0; \ 9833 poly8x8_t __s1 = __p1; \ 9834 __ret = (poly8x8_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 4); \ 9835 __ret; \ 9836 }) 9837 #else 9838 #define vext_p8(__p0, __p1, __p2) __extension__ ({ \ 9839 poly8x8_t __ret; \ 9840 poly8x8_t __s0 = __p0; \ 9841 poly8x8_t __s1 = __p1; \ 9842 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 9843 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 9844 __ret = (poly8x8_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 4); \ 9845 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 9846 __ret; \ 9847 }) 9848 #endif 9849 9850 #ifdef __LITTLE_ENDIAN__ 9851 #define vext_p16(__p0, __p1, __p2) __extension__ ({ \ 9852 poly16x4_t __ret; \ 9853 poly16x4_t __s0 = __p0; \ 9854 poly16x4_t __s1 = __p1; \ 9855 __ret = (poly16x4_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 5); \ 9856 __ret; \ 9857 }) 9858 #else 9859 #define vext_p16(__p0, __p1, __p2) __extension__ ({ \ 9860 poly16x4_t __ret; \ 9861 poly16x4_t __s0 = __p0; \ 9862 poly16x4_t __s1 = __p1; \ 9863 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 9864 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 9865 __ret = (poly16x4_t) __builtin_neon_vext_v((int8x8_t)__rev0, 
(int8x8_t)__rev1, __p2, 5); \ 9866 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 9867 __ret; \ 9868 }) 9869 #endif 9870 9871 #ifdef __LITTLE_ENDIAN__ 9872 #define vextq_p8(__p0, __p1, __p2) __extension__ ({ \ 9873 poly8x16_t __ret; \ 9874 poly8x16_t __s0 = __p0; \ 9875 poly8x16_t __s1 = __p1; \ 9876 __ret = (poly8x16_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \ 9877 __ret; \ 9878 }) 9879 #else 9880 #define vextq_p8(__p0, __p1, __p2) __extension__ ({ \ 9881 poly8x16_t __ret; \ 9882 poly8x16_t __s0 = __p0; \ 9883 poly8x16_t __s1 = __p1; \ 9884 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 9885 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 9886 __ret = (poly8x16_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \ 9887 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 9888 __ret; \ 9889 }) 9890 #endif 9891 9892 #ifdef __LITTLE_ENDIAN__ 9893 #define vextq_p16(__p0, __p1, __p2) __extension__ ({ \ 9894 poly16x8_t __ret; \ 9895 poly16x8_t __s0 = __p0; \ 9896 poly16x8_t __s1 = __p1; \ 9897 __ret = (poly16x8_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 37); \ 9898 __ret; \ 9899 }) 9900 #else 9901 #define vextq_p16(__p0, __p1, __p2) __extension__ ({ \ 9902 poly16x8_t __ret; \ 9903 poly16x8_t __s0 = __p0; \ 9904 poly16x8_t __s1 = __p1; \ 9905 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 9906 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 9907 __ret = (poly16x8_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 37); \ 9908 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 9909 __ret; \ 9910 }) 9911 #endif 9912 9913 #ifdef __LITTLE_ENDIAN__ 9914 #define 
vextq_u8(__p0, __p1, __p2) __extension__ ({ \ 9915 uint8x16_t __ret; \ 9916 uint8x16_t __s0 = __p0; \ 9917 uint8x16_t __s1 = __p1; \ 9918 __ret = (uint8x16_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \ 9919 __ret; \ 9920 }) 9921 #else 9922 #define vextq_u8(__p0, __p1, __p2) __extension__ ({ \ 9923 uint8x16_t __ret; \ 9924 uint8x16_t __s0 = __p0; \ 9925 uint8x16_t __s1 = __p1; \ 9926 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 9927 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 9928 __ret = (uint8x16_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \ 9929 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 9930 __ret; \ 9931 }) 9932 #endif 9933 9934 #ifdef __LITTLE_ENDIAN__ 9935 #define vextq_u32(__p0, __p1, __p2) __extension__ ({ \ 9936 uint32x4_t __ret; \ 9937 uint32x4_t __s0 = __p0; \ 9938 uint32x4_t __s1 = __p1; \ 9939 __ret = (uint32x4_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \ 9940 __ret; \ 9941 }) 9942 #else 9943 #define vextq_u32(__p0, __p1, __p2) __extension__ ({ \ 9944 uint32x4_t __ret; \ 9945 uint32x4_t __s0 = __p0; \ 9946 uint32x4_t __s1 = __p1; \ 9947 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 9948 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 9949 __ret = (uint32x4_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \ 9950 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 9951 __ret; \ 9952 }) 9953 #endif 9954 9955 #ifdef __LITTLE_ENDIAN__ 9956 #define vextq_u64(__p0, __p1, __p2) __extension__ ({ \ 9957 uint64x2_t __ret; \ 9958 uint64x2_t __s0 = __p0; \ 9959 uint64x2_t __s1 = __p1; \ 9960 __ret = (uint64x2_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 
51); \ 9961 __ret; \ 9962 }) 9963 #else 9964 #define vextq_u64(__p0, __p1, __p2) __extension__ ({ \ 9965 uint64x2_t __ret; \ 9966 uint64x2_t __s0 = __p0; \ 9967 uint64x2_t __s1 = __p1; \ 9968 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 9969 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 9970 __ret = (uint64x2_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \ 9971 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 9972 __ret; \ 9973 }) 9974 #endif 9975 9976 #ifdef __LITTLE_ENDIAN__ 9977 #define vextq_u16(__p0, __p1, __p2) __extension__ ({ \ 9978 uint16x8_t __ret; \ 9979 uint16x8_t __s0 = __p0; \ 9980 uint16x8_t __s1 = __p1; \ 9981 __ret = (uint16x8_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \ 9982 __ret; \ 9983 }) 9984 #else 9985 #define vextq_u16(__p0, __p1, __p2) __extension__ ({ \ 9986 uint16x8_t __ret; \ 9987 uint16x8_t __s0 = __p0; \ 9988 uint16x8_t __s1 = __p1; \ 9989 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 9990 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 9991 __ret = (uint16x8_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \ 9992 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 9993 __ret; \ 9994 }) 9995 #endif 9996 9997 #ifdef __LITTLE_ENDIAN__ 9998 #define vextq_s8(__p0, __p1, __p2) __extension__ ({ \ 9999 int8x16_t __ret; \ 10000 int8x16_t __s0 = __p0; \ 10001 int8x16_t __s1 = __p1; \ 10002 __ret = (int8x16_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \ 10003 __ret; \ 10004 }) 10005 #else 10006 #define vextq_s8(__p0, __p1, __p2) __extension__ ({ \ 10007 int8x16_t __ret; \ 10008 int8x16_t __s0 = __p0; \ 10009 int8x16_t __s1 = __p1; \ 10010 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 10011 int8x16_t 
__rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 10012 __ret = (int8x16_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \ 10013 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 10014 __ret; \ 10015 }) 10016 #endif 10017 10018 #ifdef __LITTLE_ENDIAN__ 10019 #define vextq_f32(__p0, __p1, __p2) __extension__ ({ \ 10020 float32x4_t __ret; \ 10021 float32x4_t __s0 = __p0; \ 10022 float32x4_t __s1 = __p1; \ 10023 __ret = (float32x4_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 41); \ 10024 __ret; \ 10025 }) 10026 #else 10027 #define vextq_f32(__p0, __p1, __p2) __extension__ ({ \ 10028 float32x4_t __ret; \ 10029 float32x4_t __s0 = __p0; \ 10030 float32x4_t __s1 = __p1; \ 10031 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10032 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 10033 __ret = (float32x4_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 41); \ 10034 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 10035 __ret; \ 10036 }) 10037 #endif 10038 10039 #ifdef __LITTLE_ENDIAN__ 10040 #define vextq_s32(__p0, __p1, __p2) __extension__ ({ \ 10041 int32x4_t __ret; \ 10042 int32x4_t __s0 = __p0; \ 10043 int32x4_t __s1 = __p1; \ 10044 __ret = (int32x4_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \ 10045 __ret; \ 10046 }) 10047 #else 10048 #define vextq_s32(__p0, __p1, __p2) __extension__ ({ \ 10049 int32x4_t __ret; \ 10050 int32x4_t __s0 = __p0; \ 10051 int32x4_t __s1 = __p1; \ 10052 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10053 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 10054 __ret = (int32x4_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \ 10055 __ret = __builtin_shufflevector(__ret, __ret, 
3, 2, 1, 0); \ 10056 __ret; \ 10057 }) 10058 #endif 10059 10060 #ifdef __LITTLE_ENDIAN__ 10061 #define vextq_s64(__p0, __p1, __p2) __extension__ ({ \ 10062 int64x2_t __ret; \ 10063 int64x2_t __s0 = __p0; \ 10064 int64x2_t __s1 = __p1; \ 10065 __ret = (int64x2_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \ 10066 __ret; \ 10067 }) 10068 #else 10069 #define vextq_s64(__p0, __p1, __p2) __extension__ ({ \ 10070 int64x2_t __ret; \ 10071 int64x2_t __s0 = __p0; \ 10072 int64x2_t __s1 = __p1; \ 10073 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 10074 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 10075 __ret = (int64x2_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \ 10076 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 10077 __ret; \ 10078 }) 10079 #endif 10080 10081 #ifdef __LITTLE_ENDIAN__ 10082 #define vextq_s16(__p0, __p1, __p2) __extension__ ({ \ 10083 int16x8_t __ret; \ 10084 int16x8_t __s0 = __p0; \ 10085 int16x8_t __s1 = __p1; \ 10086 __ret = (int16x8_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \ 10087 __ret; \ 10088 }) 10089 #else 10090 #define vextq_s16(__p0, __p1, __p2) __extension__ ({ \ 10091 int16x8_t __ret; \ 10092 int16x8_t __s0 = __p0; \ 10093 int16x8_t __s1 = __p1; \ 10094 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10095 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 10096 __ret = (int16x8_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 10097 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 10098 __ret; \ 10099 }) 10100 #endif 10101 10102 #ifdef __LITTLE_ENDIAN__ 10103 #define vext_u8(__p0, __p1, __p2) __extension__ ({ \ 10104 uint8x8_t __ret; \ 10105 uint8x8_t __s0 = __p0; \ 10106 uint8x8_t __s1 = __p1; \ 10107 __ret = (uint8x8_t) __builtin_neon_vext_v((int8x8_t)__s0, 
(int8x8_t)__s1, __p2, 16); \ 10108 __ret; \ 10109 }) 10110 #else 10111 #define vext_u8(__p0, __p1, __p2) __extension__ ({ \ 10112 uint8x8_t __ret; \ 10113 uint8x8_t __s0 = __p0; \ 10114 uint8x8_t __s1 = __p1; \ 10115 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10116 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 10117 __ret = (uint8x8_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \ 10118 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 10119 __ret; \ 10120 }) 10121 #endif 10122 10123 #ifdef __LITTLE_ENDIAN__ 10124 #define vext_u32(__p0, __p1, __p2) __extension__ ({ \ 10125 uint32x2_t __ret; \ 10126 uint32x2_t __s0 = __p0; \ 10127 uint32x2_t __s1 = __p1; \ 10128 __ret = (uint32x2_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \ 10129 __ret; \ 10130 }) 10131 #else 10132 #define vext_u32(__p0, __p1, __p2) __extension__ ({ \ 10133 uint32x2_t __ret; \ 10134 uint32x2_t __s0 = __p0; \ 10135 uint32x2_t __s1 = __p1; \ 10136 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 10137 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 10138 __ret = (uint32x2_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \ 10139 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 10140 __ret; \ 10141 }) 10142 #endif 10143 10144 #define vext_u64(__p0, __p1, __p2) __extension__ ({ \ 10145 uint64x1_t __ret; \ 10146 uint64x1_t __s0 = __p0; \ 10147 uint64x1_t __s1 = __p1; \ 10148 __ret = (uint64x1_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \ 10149 __ret; \ 10150 }) 10151 #ifdef __LITTLE_ENDIAN__ 10152 #define vext_u16(__p0, __p1, __p2) __extension__ ({ \ 10153 uint16x4_t __ret; \ 10154 uint16x4_t __s0 = __p0; \ 10155 uint16x4_t __s1 = __p1; \ 10156 __ret = (uint16x4_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \ 10157 __ret; 
\ 10158 }) 10159 #else 10160 #define vext_u16(__p0, __p1, __p2) __extension__ ({ \ 10161 uint16x4_t __ret; \ 10162 uint16x4_t __s0 = __p0; \ 10163 uint16x4_t __s1 = __p1; \ 10164 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10165 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 10166 __ret = (uint16x4_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \ 10167 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 10168 __ret; \ 10169 }) 10170 #endif 10171 10172 #ifdef __LITTLE_ENDIAN__ 10173 #define vext_s8(__p0, __p1, __p2) __extension__ ({ \ 10174 int8x8_t __ret; \ 10175 int8x8_t __s0 = __p0; \ 10176 int8x8_t __s1 = __p1; \ 10177 __ret = (int8x8_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \ 10178 __ret; \ 10179 }) 10180 #else 10181 #define vext_s8(__p0, __p1, __p2) __extension__ ({ \ 10182 int8x8_t __ret; \ 10183 int8x8_t __s0 = __p0; \ 10184 int8x8_t __s1 = __p1; \ 10185 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10186 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 10187 __ret = (int8x8_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \ 10188 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 10189 __ret; \ 10190 }) 10191 #endif 10192 10193 #ifdef __LITTLE_ENDIAN__ 10194 #define vext_f32(__p0, __p1, __p2) __extension__ ({ \ 10195 float32x2_t __ret; \ 10196 float32x2_t __s0 = __p0; \ 10197 float32x2_t __s1 = __p1; \ 10198 __ret = (float32x2_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 9); \ 10199 __ret; \ 10200 }) 10201 #else 10202 #define vext_f32(__p0, __p1, __p2) __extension__ ({ \ 10203 float32x2_t __ret; \ 10204 float32x2_t __s0 = __p0; \ 10205 float32x2_t __s1 = __p1; \ 10206 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 10207 float32x2_t __rev1; __rev1 = 
__builtin_shufflevector(__s1, __s1, 1, 0); \ 10208 __ret = (float32x2_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 9); \ 10209 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 10210 __ret; \ 10211 }) 10212 #endif 10213 10214 #ifdef __LITTLE_ENDIAN__ 10215 #define vext_s32(__p0, __p1, __p2) __extension__ ({ \ 10216 int32x2_t __ret; \ 10217 int32x2_t __s0 = __p0; \ 10218 int32x2_t __s1 = __p1; \ 10219 __ret = (int32x2_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \ 10220 __ret; \ 10221 }) 10222 #else 10223 #define vext_s32(__p0, __p1, __p2) __extension__ ({ \ 10224 int32x2_t __ret; \ 10225 int32x2_t __s0 = __p0; \ 10226 int32x2_t __s1 = __p1; \ 10227 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 10228 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 10229 __ret = (int32x2_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 10230 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 10231 __ret; \ 10232 }) 10233 #endif 10234 10235 #define vext_s64(__p0, __p1, __p2) __extension__ ({ \ 10236 int64x1_t __ret; \ 10237 int64x1_t __s0 = __p0; \ 10238 int64x1_t __s1 = __p1; \ 10239 __ret = (int64x1_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \ 10240 __ret; \ 10241 }) 10242 #ifdef __LITTLE_ENDIAN__ 10243 #define vext_s16(__p0, __p1, __p2) __extension__ ({ \ 10244 int16x4_t __ret; \ 10245 int16x4_t __s0 = __p0; \ 10246 int16x4_t __s1 = __p1; \ 10247 __ret = (int16x4_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \ 10248 __ret; \ 10249 }) 10250 #else 10251 #define vext_s16(__p0, __p1, __p2) __extension__ ({ \ 10252 int16x4_t __ret; \ 10253 int16x4_t __s0 = __p0; \ 10254 int16x4_t __s1 = __p1; \ 10255 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10256 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 10257 __ret = (int16x4_t) 
__builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 10258 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 10259 __ret; \ 10260 }) 10261 #endif 10262 10263 #ifdef __LITTLE_ENDIAN__ 10264 #define vextq_f16(__p0, __p1, __p2) __extension__ ({ \ 10265 float16x8_t __ret; \ 10266 float16x8_t __s0 = __p0; \ 10267 float16x8_t __s1 = __p1; \ 10268 __ret = (float16x8_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 40); \ 10269 __ret; \ 10270 }) 10271 #else 10272 #define vextq_f16(__p0, __p1, __p2) __extension__ ({ \ 10273 float16x8_t __ret; \ 10274 float16x8_t __s0 = __p0; \ 10275 float16x8_t __s1 = __p1; \ 10276 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10277 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 10278 __ret = (float16x8_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 40); \ 10279 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 10280 __ret; \ 10281 }) 10282 #endif 10283 10284 #ifdef __LITTLE_ENDIAN__ 10285 #define vext_f16(__p0, __p1, __p2) __extension__ ({ \ 10286 float16x4_t __ret; \ 10287 float16x4_t __s0 = __p0; \ 10288 float16x4_t __s1 = __p1; \ 10289 __ret = (float16x4_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 8); \ 10290 __ret; \ 10291 }) 10292 #else 10293 #define vext_f16(__p0, __p1, __p2) __extension__ ({ \ 10294 float16x4_t __ret; \ 10295 float16x4_t __s0 = __p0; \ 10296 float16x4_t __s1 = __p1; \ 10297 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10298 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 10299 __ret = (float16x4_t) __builtin_neon_vext_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 8); \ 10300 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 10301 __ret; \ 10302 }) 10303 #endif 10304 10305 #ifdef __LITTLE_ENDIAN__ 10306 __ai __attribute__((target("neon"))) 
poly8x8_t vget_high_p8(poly8x16_t __p0) { 10307 poly8x8_t __ret; 10308 __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15); 10309 return __ret; 10310 } 10311 #else 10312 __ai __attribute__((target("neon"))) poly8x8_t vget_high_p8(poly8x16_t __p0) { 10313 poly8x8_t __ret; 10314 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 10315 __ret = __builtin_shufflevector(__rev0, __rev0, 8, 9, 10, 11, 12, 13, 14, 15); 10316 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 10317 return __ret; 10318 } 10319 __ai __attribute__((target("neon"))) poly8x8_t __noswap_vget_high_p8(poly8x16_t __p0) { 10320 poly8x8_t __ret; 10321 __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15); 10322 return __ret; 10323 } 10324 #endif 10325 10326 #ifdef __LITTLE_ENDIAN__ 10327 __ai __attribute__((target("neon"))) poly16x4_t vget_high_p16(poly16x8_t __p0) { 10328 poly16x4_t __ret; 10329 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 10330 return __ret; 10331 } 10332 #else 10333 __ai __attribute__((target("neon"))) poly16x4_t vget_high_p16(poly16x8_t __p0) { 10334 poly16x4_t __ret; 10335 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 10336 __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7); 10337 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 10338 return __ret; 10339 } 10340 #endif 10341 10342 #ifdef __LITTLE_ENDIAN__ 10343 __ai __attribute__((target("neon"))) uint8x8_t vget_high_u8(uint8x16_t __p0) { 10344 uint8x8_t __ret; 10345 __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15); 10346 return __ret; 10347 } 10348 #else 10349 __ai __attribute__((target("neon"))) uint8x8_t vget_high_u8(uint8x16_t __p0) { 10350 uint8x8_t __ret; 10351 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 10352 __ret = 
__builtin_shufflevector(__rev0, __rev0, 8, 9, 10, 11, 12, 13, 14, 15); 10353 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 10354 return __ret; 10355 } 10356 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vget_high_u8(uint8x16_t __p0) { 10357 uint8x8_t __ret; 10358 __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15); 10359 return __ret; 10360 } 10361 #endif 10362 10363 #ifdef __LITTLE_ENDIAN__ 10364 __ai __attribute__((target("neon"))) uint32x2_t vget_high_u32(uint32x4_t __p0) { 10365 uint32x2_t __ret; 10366 __ret = __builtin_shufflevector(__p0, __p0, 2, 3); 10367 return __ret; 10368 } 10369 #else 10370 __ai __attribute__((target("neon"))) uint32x2_t vget_high_u32(uint32x4_t __p0) { 10371 uint32x2_t __ret; 10372 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 10373 __ret = __builtin_shufflevector(__rev0, __rev0, 2, 3); 10374 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 10375 return __ret; 10376 } 10377 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vget_high_u32(uint32x4_t __p0) { 10378 uint32x2_t __ret; 10379 __ret = __builtin_shufflevector(__p0, __p0, 2, 3); 10380 return __ret; 10381 } 10382 #endif 10383 10384 #ifdef __LITTLE_ENDIAN__ 10385 __ai __attribute__((target("neon"))) uint64x1_t vget_high_u64(uint64x2_t __p0) { 10386 uint64x1_t __ret; 10387 __ret = __builtin_shufflevector(__p0, __p0, 1); 10388 return __ret; 10389 } 10390 #else 10391 __ai __attribute__((target("neon"))) uint64x1_t vget_high_u64(uint64x2_t __p0) { 10392 uint64x1_t __ret; 10393 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 10394 __ret = __builtin_shufflevector(__rev0, __rev0, 1); 10395 return __ret; 10396 } 10397 #endif 10398 10399 #ifdef __LITTLE_ENDIAN__ 10400 __ai __attribute__((target("neon"))) uint16x4_t vget_high_u16(uint16x8_t __p0) { 10401 uint16x4_t __ret; 10402 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 10403 return __ret; 10404 } 10405 #else 
10406 __ai __attribute__((target("neon"))) uint16x4_t vget_high_u16(uint16x8_t __p0) { 10407 uint16x4_t __ret; 10408 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 10409 __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7); 10410 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 10411 return __ret; 10412 } 10413 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vget_high_u16(uint16x8_t __p0) { 10414 uint16x4_t __ret; 10415 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 10416 return __ret; 10417 } 10418 #endif 10419 10420 #ifdef __LITTLE_ENDIAN__ 10421 __ai __attribute__((target("neon"))) int8x8_t vget_high_s8(int8x16_t __p0) { 10422 int8x8_t __ret; 10423 __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15); 10424 return __ret; 10425 } 10426 #else 10427 __ai __attribute__((target("neon"))) int8x8_t vget_high_s8(int8x16_t __p0) { 10428 int8x8_t __ret; 10429 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 10430 __ret = __builtin_shufflevector(__rev0, __rev0, 8, 9, 10, 11, 12, 13, 14, 15); 10431 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 10432 return __ret; 10433 } 10434 __ai __attribute__((target("neon"))) int8x8_t __noswap_vget_high_s8(int8x16_t __p0) { 10435 int8x8_t __ret; 10436 __ret = __builtin_shufflevector(__p0, __p0, 8, 9, 10, 11, 12, 13, 14, 15); 10437 return __ret; 10438 } 10439 #endif 10440 10441 #ifdef __LITTLE_ENDIAN__ 10442 __ai __attribute__((target("neon"))) float32x2_t vget_high_f32(float32x4_t __p0) { 10443 float32x2_t __ret; 10444 __ret = __builtin_shufflevector(__p0, __p0, 2, 3); 10445 return __ret; 10446 } 10447 #else 10448 __ai __attribute__((target("neon"))) float32x2_t vget_high_f32(float32x4_t __p0) { 10449 float32x2_t __ret; 10450 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 10451 __ret = __builtin_shufflevector(__rev0, 
__rev0, 2, 3); 10452 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 10453 return __ret; 10454 } 10455 __ai __attribute__((target("neon"))) float32x2_t __noswap_vget_high_f32(float32x4_t __p0) { 10456 float32x2_t __ret; 10457 __ret = __builtin_shufflevector(__p0, __p0, 2, 3); 10458 return __ret; 10459 } 10460 #endif 10461 10462 #ifdef __LITTLE_ENDIAN__ 10463 __ai __attribute__((target("neon"))) float16x4_t vget_high_f16(float16x8_t __p0) { 10464 float16x4_t __ret; 10465 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 10466 return __ret; 10467 } 10468 #else 10469 __ai __attribute__((target("neon"))) float16x4_t vget_high_f16(float16x8_t __p0) { 10470 float16x4_t __ret; 10471 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 10472 __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7); 10473 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 10474 return __ret; 10475 } 10476 __ai __attribute__((target("neon"))) float16x4_t __noswap_vget_high_f16(float16x8_t __p0) { 10477 float16x4_t __ret; 10478 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 10479 return __ret; 10480 } 10481 #endif 10482 10483 #ifdef __LITTLE_ENDIAN__ 10484 __ai __attribute__((target("neon"))) int32x2_t vget_high_s32(int32x4_t __p0) { 10485 int32x2_t __ret; 10486 __ret = __builtin_shufflevector(__p0, __p0, 2, 3); 10487 return __ret; 10488 } 10489 #else 10490 __ai __attribute__((target("neon"))) int32x2_t vget_high_s32(int32x4_t __p0) { 10491 int32x2_t __ret; 10492 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 10493 __ret = __builtin_shufflevector(__rev0, __rev0, 2, 3); 10494 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 10495 return __ret; 10496 } 10497 __ai __attribute__((target("neon"))) int32x2_t __noswap_vget_high_s32(int32x4_t __p0) { 10498 int32x2_t __ret; 10499 __ret = __builtin_shufflevector(__p0, __p0, 2, 3); 10500 return __ret; 10501 } 10502 #endif 10503 10504 #ifdef 
__LITTLE_ENDIAN__ 10505 __ai __attribute__((target("neon"))) int64x1_t vget_high_s64(int64x2_t __p0) { 10506 int64x1_t __ret; 10507 __ret = __builtin_shufflevector(__p0, __p0, 1); 10508 return __ret; 10509 } 10510 #else 10511 __ai __attribute__((target("neon"))) int64x1_t vget_high_s64(int64x2_t __p0) { 10512 int64x1_t __ret; 10513 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 10514 __ret = __builtin_shufflevector(__rev0, __rev0, 1); 10515 return __ret; 10516 } 10517 #endif 10518 10519 #ifdef __LITTLE_ENDIAN__ 10520 __ai __attribute__((target("neon"))) int16x4_t vget_high_s16(int16x8_t __p0) { 10521 int16x4_t __ret; 10522 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 10523 return __ret; 10524 } 10525 #else 10526 __ai __attribute__((target("neon"))) int16x4_t vget_high_s16(int16x8_t __p0) { 10527 int16x4_t __ret; 10528 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 10529 __ret = __builtin_shufflevector(__rev0, __rev0, 4, 5, 6, 7); 10530 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 10531 return __ret; 10532 } 10533 __ai __attribute__((target("neon"))) int16x4_t __noswap_vget_high_s16(int16x8_t __p0) { 10534 int16x4_t __ret; 10535 __ret = __builtin_shufflevector(__p0, __p0, 4, 5, 6, 7); 10536 return __ret; 10537 } 10538 #endif 10539 10540 #ifdef __LITTLE_ENDIAN__ 10541 #define vget_lane_p8(__p0, __p1) __extension__ ({ \ 10542 poly8_t __ret; \ 10543 poly8x8_t __s0 = __p0; \ 10544 __ret = (poly8_t) __builtin_neon_vget_lane_i8((poly8x8_t)__s0, __p1); \ 10545 __ret; \ 10546 }) 10547 #else 10548 #define vget_lane_p8(__p0, __p1) __extension__ ({ \ 10549 poly8_t __ret; \ 10550 poly8x8_t __s0 = __p0; \ 10551 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10552 __ret = (poly8_t) __builtin_neon_vget_lane_i8((poly8x8_t)__rev0, __p1); \ 10553 __ret; \ 10554 }) 10555 #define __noswap_vget_lane_p8(__p0, __p1) __extension__ ({ \ 10556 poly8_t __ret; \ 
10557 poly8x8_t __s0 = __p0; \ 10558 __ret = (poly8_t) __builtin_neon_vget_lane_i8((poly8x8_t)__s0, __p1); \ 10559 __ret; \ 10560 }) 10561 #endif 10562 10563 #ifdef __LITTLE_ENDIAN__ 10564 #define vget_lane_p16(__p0, __p1) __extension__ ({ \ 10565 poly16_t __ret; \ 10566 poly16x4_t __s0 = __p0; \ 10567 __ret = (poly16_t) __builtin_neon_vget_lane_i16((poly16x4_t)__s0, __p1); \ 10568 __ret; \ 10569 }) 10570 #else 10571 #define vget_lane_p16(__p0, __p1) __extension__ ({ \ 10572 poly16_t __ret; \ 10573 poly16x4_t __s0 = __p0; \ 10574 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10575 __ret = (poly16_t) __builtin_neon_vget_lane_i16((poly16x4_t)__rev0, __p1); \ 10576 __ret; \ 10577 }) 10578 #define __noswap_vget_lane_p16(__p0, __p1) __extension__ ({ \ 10579 poly16_t __ret; \ 10580 poly16x4_t __s0 = __p0; \ 10581 __ret = (poly16_t) __builtin_neon_vget_lane_i16((poly16x4_t)__s0, __p1); \ 10582 __ret; \ 10583 }) 10584 #endif 10585 10586 #ifdef __LITTLE_ENDIAN__ 10587 #define vgetq_lane_p8(__p0, __p1) __extension__ ({ \ 10588 poly8_t __ret; \ 10589 poly8x16_t __s0 = __p0; \ 10590 __ret = (poly8_t) __builtin_neon_vgetq_lane_i8((poly8x16_t)__s0, __p1); \ 10591 __ret; \ 10592 }) 10593 #else 10594 #define vgetq_lane_p8(__p0, __p1) __extension__ ({ \ 10595 poly8_t __ret; \ 10596 poly8x16_t __s0 = __p0; \ 10597 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 10598 __ret = (poly8_t) __builtin_neon_vgetq_lane_i8((poly8x16_t)__rev0, __p1); \ 10599 __ret; \ 10600 }) 10601 #define __noswap_vgetq_lane_p8(__p0, __p1) __extension__ ({ \ 10602 poly8_t __ret; \ 10603 poly8x16_t __s0 = __p0; \ 10604 __ret = (poly8_t) __builtin_neon_vgetq_lane_i8((poly8x16_t)__s0, __p1); \ 10605 __ret; \ 10606 }) 10607 #endif 10608 10609 #ifdef __LITTLE_ENDIAN__ 10610 #define vgetq_lane_p16(__p0, __p1) __extension__ ({ \ 10611 poly16_t __ret; \ 10612 poly16x8_t __s0 = __p0; \ 10613 __ret = (poly16_t) 
__builtin_neon_vgetq_lane_i16((poly16x8_t)__s0, __p1); \ 10614 __ret; \ 10615 }) 10616 #else 10617 #define vgetq_lane_p16(__p0, __p1) __extension__ ({ \ 10618 poly16_t __ret; \ 10619 poly16x8_t __s0 = __p0; \ 10620 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10621 __ret = (poly16_t) __builtin_neon_vgetq_lane_i16((poly16x8_t)__rev0, __p1); \ 10622 __ret; \ 10623 }) 10624 #define __noswap_vgetq_lane_p16(__p0, __p1) __extension__ ({ \ 10625 poly16_t __ret; \ 10626 poly16x8_t __s0 = __p0; \ 10627 __ret = (poly16_t) __builtin_neon_vgetq_lane_i16((poly16x8_t)__s0, __p1); \ 10628 __ret; \ 10629 }) 10630 #endif 10631 10632 #ifdef __LITTLE_ENDIAN__ 10633 #define vgetq_lane_u8(__p0, __p1) __extension__ ({ \ 10634 uint8_t __ret; \ 10635 uint8x16_t __s0 = __p0; \ 10636 __ret = (uint8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__s0, __p1); \ 10637 __ret; \ 10638 }) 10639 #else 10640 #define vgetq_lane_u8(__p0, __p1) __extension__ ({ \ 10641 uint8_t __ret; \ 10642 uint8x16_t __s0 = __p0; \ 10643 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 10644 __ret = (uint8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__rev0, __p1); \ 10645 __ret; \ 10646 }) 10647 #define __noswap_vgetq_lane_u8(__p0, __p1) __extension__ ({ \ 10648 uint8_t __ret; \ 10649 uint8x16_t __s0 = __p0; \ 10650 __ret = (uint8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__s0, __p1); \ 10651 __ret; \ 10652 }) 10653 #endif 10654 10655 #ifdef __LITTLE_ENDIAN__ 10656 #define vgetq_lane_u32(__p0, __p1) __extension__ ({ \ 10657 uint32_t __ret; \ 10658 uint32x4_t __s0 = __p0; \ 10659 __ret = (uint32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__s0, __p1); \ 10660 __ret; \ 10661 }) 10662 #else 10663 #define vgetq_lane_u32(__p0, __p1) __extension__ ({ \ 10664 uint32_t __ret; \ 10665 uint32x4_t __s0 = __p0; \ 10666 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10667 __ret = 
(uint32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__rev0, __p1); \ 10668 __ret; \ 10669 }) 10670 #define __noswap_vgetq_lane_u32(__p0, __p1) __extension__ ({ \ 10671 uint32_t __ret; \ 10672 uint32x4_t __s0 = __p0; \ 10673 __ret = (uint32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__s0, __p1); \ 10674 __ret; \ 10675 }) 10676 #endif 10677 10678 #ifdef __LITTLE_ENDIAN__ 10679 #define vgetq_lane_u64(__p0, __p1) __extension__ ({ \ 10680 uint64_t __ret; \ 10681 uint64x2_t __s0 = __p0; \ 10682 __ret = (uint64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__s0, __p1); \ 10683 __ret; \ 10684 }) 10685 #else 10686 #define vgetq_lane_u64(__p0, __p1) __extension__ ({ \ 10687 uint64_t __ret; \ 10688 uint64x2_t __s0 = __p0; \ 10689 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 10690 __ret = (uint64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__rev0, __p1); \ 10691 __ret; \ 10692 }) 10693 #define __noswap_vgetq_lane_u64(__p0, __p1) __extension__ ({ \ 10694 uint64_t __ret; \ 10695 uint64x2_t __s0 = __p0; \ 10696 __ret = (uint64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__s0, __p1); \ 10697 __ret; \ 10698 }) 10699 #endif 10700 10701 #ifdef __LITTLE_ENDIAN__ 10702 #define vgetq_lane_u16(__p0, __p1) __extension__ ({ \ 10703 uint16_t __ret; \ 10704 uint16x8_t __s0 = __p0; \ 10705 __ret = (uint16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__s0, __p1); \ 10706 __ret; \ 10707 }) 10708 #else 10709 #define vgetq_lane_u16(__p0, __p1) __extension__ ({ \ 10710 uint16_t __ret; \ 10711 uint16x8_t __s0 = __p0; \ 10712 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10713 __ret = (uint16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__rev0, __p1); \ 10714 __ret; \ 10715 }) 10716 #define __noswap_vgetq_lane_u16(__p0, __p1) __extension__ ({ \ 10717 uint16_t __ret; \ 10718 uint16x8_t __s0 = __p0; \ 10719 __ret = (uint16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__s0, __p1); \ 10720 __ret; \ 10721 }) 10722 #endif 10723 10724 
#ifdef __LITTLE_ENDIAN__ 10725 #define vgetq_lane_s8(__p0, __p1) __extension__ ({ \ 10726 int8_t __ret; \ 10727 int8x16_t __s0 = __p0; \ 10728 __ret = (int8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__s0, __p1); \ 10729 __ret; \ 10730 }) 10731 #else 10732 #define vgetq_lane_s8(__p0, __p1) __extension__ ({ \ 10733 int8_t __ret; \ 10734 int8x16_t __s0 = __p0; \ 10735 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 10736 __ret = (int8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__rev0, __p1); \ 10737 __ret; \ 10738 }) 10739 #define __noswap_vgetq_lane_s8(__p0, __p1) __extension__ ({ \ 10740 int8_t __ret; \ 10741 int8x16_t __s0 = __p0; \ 10742 __ret = (int8_t) __builtin_neon_vgetq_lane_i8((int8x16_t)__s0, __p1); \ 10743 __ret; \ 10744 }) 10745 #endif 10746 10747 #ifdef __LITTLE_ENDIAN__ 10748 #define vgetq_lane_f32(__p0, __p1) __extension__ ({ \ 10749 float32_t __ret; \ 10750 float32x4_t __s0 = __p0; \ 10751 __ret = (float32_t) __builtin_neon_vgetq_lane_f32((float32x4_t)__s0, __p1); \ 10752 __ret; \ 10753 }) 10754 #else 10755 #define vgetq_lane_f32(__p0, __p1) __extension__ ({ \ 10756 float32_t __ret; \ 10757 float32x4_t __s0 = __p0; \ 10758 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10759 __ret = (float32_t) __builtin_neon_vgetq_lane_f32((float32x4_t)__rev0, __p1); \ 10760 __ret; \ 10761 }) 10762 #define __noswap_vgetq_lane_f32(__p0, __p1) __extension__ ({ \ 10763 float32_t __ret; \ 10764 float32x4_t __s0 = __p0; \ 10765 __ret = (float32_t) __builtin_neon_vgetq_lane_f32((float32x4_t)__s0, __p1); \ 10766 __ret; \ 10767 }) 10768 #endif 10769 10770 #ifdef __LITTLE_ENDIAN__ 10771 #define vgetq_lane_s32(__p0, __p1) __extension__ ({ \ 10772 int32_t __ret; \ 10773 int32x4_t __s0 = __p0; \ 10774 __ret = (int32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__s0, __p1); \ 10775 __ret; \ 10776 }) 10777 #else 10778 #define vgetq_lane_s32(__p0, __p1) __extension__ ({ \ 10779 
int32_t __ret; \ 10780 int32x4_t __s0 = __p0; \ 10781 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10782 __ret = (int32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__rev0, __p1); \ 10783 __ret; \ 10784 }) 10785 #define __noswap_vgetq_lane_s32(__p0, __p1) __extension__ ({ \ 10786 int32_t __ret; \ 10787 int32x4_t __s0 = __p0; \ 10788 __ret = (int32_t) __builtin_neon_vgetq_lane_i32((int32x4_t)__s0, __p1); \ 10789 __ret; \ 10790 }) 10791 #endif 10792 10793 #ifdef __LITTLE_ENDIAN__ 10794 #define vgetq_lane_s64(__p0, __p1) __extension__ ({ \ 10795 int64_t __ret; \ 10796 int64x2_t __s0 = __p0; \ 10797 __ret = (int64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__s0, __p1); \ 10798 __ret; \ 10799 }) 10800 #else 10801 #define vgetq_lane_s64(__p0, __p1) __extension__ ({ \ 10802 int64_t __ret; \ 10803 int64x2_t __s0 = __p0; \ 10804 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 10805 __ret = (int64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__rev0, __p1); \ 10806 __ret; \ 10807 }) 10808 #define __noswap_vgetq_lane_s64(__p0, __p1) __extension__ ({ \ 10809 int64_t __ret; \ 10810 int64x2_t __s0 = __p0; \ 10811 __ret = (int64_t) __builtin_neon_vgetq_lane_i64((int64x2_t)__s0, __p1); \ 10812 __ret; \ 10813 }) 10814 #endif 10815 10816 #ifdef __LITTLE_ENDIAN__ 10817 #define vgetq_lane_s16(__p0, __p1) __extension__ ({ \ 10818 int16_t __ret; \ 10819 int16x8_t __s0 = __p0; \ 10820 __ret = (int16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__s0, __p1); \ 10821 __ret; \ 10822 }) 10823 #else 10824 #define vgetq_lane_s16(__p0, __p1) __extension__ ({ \ 10825 int16_t __ret; \ 10826 int16x8_t __s0 = __p0; \ 10827 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10828 __ret = (int16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__rev0, __p1); \ 10829 __ret; \ 10830 }) 10831 #define __noswap_vgetq_lane_s16(__p0, __p1) __extension__ ({ \ 10832 int16_t __ret; \ 10833 int16x8_t __s0 = __p0; \ 10834 
__ret = (int16_t) __builtin_neon_vgetq_lane_i16((int16x8_t)__s0, __p1); \ 10835 __ret; \ 10836 }) 10837 #endif 10838 10839 #ifdef __LITTLE_ENDIAN__ 10840 #define vget_lane_u8(__p0, __p1) __extension__ ({ \ 10841 uint8_t __ret; \ 10842 uint8x8_t __s0 = __p0; \ 10843 __ret = (uint8_t) __builtin_neon_vget_lane_i8((int8x8_t)__s0, __p1); \ 10844 __ret; \ 10845 }) 10846 #else 10847 #define vget_lane_u8(__p0, __p1) __extension__ ({ \ 10848 uint8_t __ret; \ 10849 uint8x8_t __s0 = __p0; \ 10850 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10851 __ret = (uint8_t) __builtin_neon_vget_lane_i8((int8x8_t)__rev0, __p1); \ 10852 __ret; \ 10853 }) 10854 #define __noswap_vget_lane_u8(__p0, __p1) __extension__ ({ \ 10855 uint8_t __ret; \ 10856 uint8x8_t __s0 = __p0; \ 10857 __ret = (uint8_t) __builtin_neon_vget_lane_i8((int8x8_t)__s0, __p1); \ 10858 __ret; \ 10859 }) 10860 #endif 10861 10862 #ifdef __LITTLE_ENDIAN__ 10863 #define vget_lane_u32(__p0, __p1) __extension__ ({ \ 10864 uint32_t __ret; \ 10865 uint32x2_t __s0 = __p0; \ 10866 __ret = (uint32_t) __builtin_neon_vget_lane_i32((int32x2_t)__s0, __p1); \ 10867 __ret; \ 10868 }) 10869 #else 10870 #define vget_lane_u32(__p0, __p1) __extension__ ({ \ 10871 uint32_t __ret; \ 10872 uint32x2_t __s0 = __p0; \ 10873 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 10874 __ret = (uint32_t) __builtin_neon_vget_lane_i32((int32x2_t)__rev0, __p1); \ 10875 __ret; \ 10876 }) 10877 #define __noswap_vget_lane_u32(__p0, __p1) __extension__ ({ \ 10878 uint32_t __ret; \ 10879 uint32x2_t __s0 = __p0; \ 10880 __ret = (uint32_t) __builtin_neon_vget_lane_i32((int32x2_t)__s0, __p1); \ 10881 __ret; \ 10882 }) 10883 #endif 10884 10885 #define vget_lane_u64(__p0, __p1) __extension__ ({ \ 10886 uint64_t __ret; \ 10887 uint64x1_t __s0 = __p0; \ 10888 __ret = (uint64_t) __builtin_neon_vget_lane_i64((int64x1_t)__s0, __p1); \ 10889 __ret; \ 10890 }) 10891 #ifdef __LITTLE_ENDIAN__ 10892 #define 
vget_lane_u16(__p0, __p1) __extension__ ({ \ 10893 uint16_t __ret; \ 10894 uint16x4_t __s0 = __p0; \ 10895 __ret = (uint16_t) __builtin_neon_vget_lane_i16((int16x4_t)__s0, __p1); \ 10896 __ret; \ 10897 }) 10898 #else 10899 #define vget_lane_u16(__p0, __p1) __extension__ ({ \ 10900 uint16_t __ret; \ 10901 uint16x4_t __s0 = __p0; \ 10902 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 10903 __ret = (uint16_t) __builtin_neon_vget_lane_i16((int16x4_t)__rev0, __p1); \ 10904 __ret; \ 10905 }) 10906 #define __noswap_vget_lane_u16(__p0, __p1) __extension__ ({ \ 10907 uint16_t __ret; \ 10908 uint16x4_t __s0 = __p0; \ 10909 __ret = (uint16_t) __builtin_neon_vget_lane_i16((int16x4_t)__s0, __p1); \ 10910 __ret; \ 10911 }) 10912 #endif 10913 10914 #ifdef __LITTLE_ENDIAN__ 10915 #define vget_lane_s8(__p0, __p1) __extension__ ({ \ 10916 int8_t __ret; \ 10917 int8x8_t __s0 = __p0; \ 10918 __ret = (int8_t) __builtin_neon_vget_lane_i8((int8x8_t)__s0, __p1); \ 10919 __ret; \ 10920 }) 10921 #else 10922 #define vget_lane_s8(__p0, __p1) __extension__ ({ \ 10923 int8_t __ret; \ 10924 int8x8_t __s0 = __p0; \ 10925 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 10926 __ret = (int8_t) __builtin_neon_vget_lane_i8((int8x8_t)__rev0, __p1); \ 10927 __ret; \ 10928 }) 10929 #define __noswap_vget_lane_s8(__p0, __p1) __extension__ ({ \ 10930 int8_t __ret; \ 10931 int8x8_t __s0 = __p0; \ 10932 __ret = (int8_t) __builtin_neon_vget_lane_i8((int8x8_t)__s0, __p1); \ 10933 __ret; \ 10934 }) 10935 #endif 10936 10937 #ifdef __LITTLE_ENDIAN__ 10938 #define vget_lane_f32(__p0, __p1) __extension__ ({ \ 10939 float32_t __ret; \ 10940 float32x2_t __s0 = __p0; \ 10941 __ret = (float32_t) __builtin_neon_vget_lane_f32((float32x2_t)__s0, __p1); \ 10942 __ret; \ 10943 }) 10944 #else 10945 #define vget_lane_f32(__p0, __p1) __extension__ ({ \ 10946 float32_t __ret; \ 10947 float32x2_t __s0 = __p0; \ 10948 float32x2_t __rev0; __rev0 = 
__builtin_shufflevector(__s0, __s0, 1, 0); \ 10949 __ret = (float32_t) __builtin_neon_vget_lane_f32((float32x2_t)__rev0, __p1); \ 10950 __ret; \ 10951 }) 10952 #define __noswap_vget_lane_f32(__p0, __p1) __extension__ ({ \ 10953 float32_t __ret; \ 10954 float32x2_t __s0 = __p0; \ 10955 __ret = (float32_t) __builtin_neon_vget_lane_f32((float32x2_t)__s0, __p1); \ 10956 __ret; \ 10957 }) 10958 #endif 10959 10960 #ifdef __LITTLE_ENDIAN__ 10961 #define vget_lane_s32(__p0, __p1) __extension__ ({ \ 10962 int32_t __ret; \ 10963 int32x2_t __s0 = __p0; \ 10964 __ret = (int32_t) __builtin_neon_vget_lane_i32((int32x2_t)__s0, __p1); \ 10965 __ret; \ 10966 }) 10967 #else 10968 #define vget_lane_s32(__p0, __p1) __extension__ ({ \ 10969 int32_t __ret; \ 10970 int32x2_t __s0 = __p0; \ 10971 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 10972 __ret = (int32_t) __builtin_neon_vget_lane_i32((int32x2_t)__rev0, __p1); \ 10973 __ret; \ 10974 }) 10975 #define __noswap_vget_lane_s32(__p0, __p1) __extension__ ({ \ 10976 int32_t __ret; \ 10977 int32x2_t __s0 = __p0; \ 10978 __ret = (int32_t) __builtin_neon_vget_lane_i32((int32x2_t)__s0, __p1); \ 10979 __ret; \ 10980 }) 10981 #endif 10982 10983 #define vget_lane_s64(__p0, __p1) __extension__ ({ \ 10984 int64_t __ret; \ 10985 int64x1_t __s0 = __p0; \ 10986 __ret = (int64_t) __builtin_neon_vget_lane_i64((int64x1_t)__s0, __p1); \ 10987 __ret; \ 10988 }) 10989 #ifdef __LITTLE_ENDIAN__ 10990 #define vget_lane_s16(__p0, __p1) __extension__ ({ \ 10991 int16_t __ret; \ 10992 int16x4_t __s0 = __p0; \ 10993 __ret = (int16_t) __builtin_neon_vget_lane_i16((int16x4_t)__s0, __p1); \ 10994 __ret; \ 10995 }) 10996 #else 10997 #define vget_lane_s16(__p0, __p1) __extension__ ({ \ 10998 int16_t __ret; \ 10999 int16x4_t __s0 = __p0; \ 11000 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 11001 __ret = (int16_t) __builtin_neon_vget_lane_i16((int16x4_t)__rev0, __p1); \ 11002 __ret; \ 11003 }) 11004 #define 
__noswap_vget_lane_s16(__p0, __p1) __extension__ ({ \ 11005 int16_t __ret; \ 11006 int16x4_t __s0 = __p0; \ 11007 __ret = (int16_t) __builtin_neon_vget_lane_i16((int16x4_t)__s0, __p1); \ 11008 __ret; \ 11009 }) 11010 #endif 11011 11012 #ifdef __LITTLE_ENDIAN__ 11013 __ai __attribute__((target("neon"))) poly8x8_t vget_low_p8(poly8x16_t __p0) { 11014 poly8x8_t __ret; 11015 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3, 4, 5, 6, 7); 11016 return __ret; 11017 } 11018 #else 11019 __ai __attribute__((target("neon"))) poly8x8_t vget_low_p8(poly8x16_t __p0) { 11020 poly8x8_t __ret; 11021 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11022 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3, 4, 5, 6, 7); 11023 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11024 return __ret; 11025 } 11026 #endif 11027 11028 #ifdef __LITTLE_ENDIAN__ 11029 __ai __attribute__((target("neon"))) poly16x4_t vget_low_p16(poly16x8_t __p0) { 11030 poly16x4_t __ret; 11031 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3); 11032 return __ret; 11033 } 11034 #else 11035 __ai __attribute__((target("neon"))) poly16x4_t vget_low_p16(poly16x8_t __p0) { 11036 poly16x4_t __ret; 11037 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11038 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3); 11039 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11040 return __ret; 11041 } 11042 #endif 11043 11044 #ifdef __LITTLE_ENDIAN__ 11045 __ai __attribute__((target("neon"))) uint8x8_t vget_low_u8(uint8x16_t __p0) { 11046 uint8x8_t __ret; 11047 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3, 4, 5, 6, 7); 11048 return __ret; 11049 } 11050 #else 11051 __ai __attribute__((target("neon"))) uint8x8_t vget_low_u8(uint8x16_t __p0) { 11052 uint8x8_t __ret; 11053 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 
9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11054 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3, 4, 5, 6, 7); 11055 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11056 return __ret; 11057 } 11058 #endif 11059 11060 #ifdef __LITTLE_ENDIAN__ 11061 __ai __attribute__((target("neon"))) uint32x2_t vget_low_u32(uint32x4_t __p0) { 11062 uint32x2_t __ret; 11063 __ret = __builtin_shufflevector(__p0, __p0, 0, 1); 11064 return __ret; 11065 } 11066 #else 11067 __ai __attribute__((target("neon"))) uint32x2_t vget_low_u32(uint32x4_t __p0) { 11068 uint32x2_t __ret; 11069 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11070 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1); 11071 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 11072 return __ret; 11073 } 11074 #endif 11075 11076 #ifdef __LITTLE_ENDIAN__ 11077 __ai __attribute__((target("neon"))) uint64x1_t vget_low_u64(uint64x2_t __p0) { 11078 uint64x1_t __ret; 11079 __ret = __builtin_shufflevector(__p0, __p0, 0); 11080 return __ret; 11081 } 11082 #else 11083 __ai __attribute__((target("neon"))) uint64x1_t vget_low_u64(uint64x2_t __p0) { 11084 uint64x1_t __ret; 11085 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 11086 __ret = __builtin_shufflevector(__rev0, __rev0, 0); 11087 return __ret; 11088 } 11089 #endif 11090 11091 #ifdef __LITTLE_ENDIAN__ 11092 __ai __attribute__((target("neon"))) uint16x4_t vget_low_u16(uint16x8_t __p0) { 11093 uint16x4_t __ret; 11094 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3); 11095 return __ret; 11096 } 11097 #else 11098 __ai __attribute__((target("neon"))) uint16x4_t vget_low_u16(uint16x8_t __p0) { 11099 uint16x4_t __ret; 11100 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11101 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3); 11102 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11103 return __ret; 11104 } 11105 #endif 11106 11107 #ifdef 
__LITTLE_ENDIAN__ 11108 __ai __attribute__((target("neon"))) int8x8_t vget_low_s8(int8x16_t __p0) { 11109 int8x8_t __ret; 11110 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3, 4, 5, 6, 7); 11111 return __ret; 11112 } 11113 #else 11114 __ai __attribute__((target("neon"))) int8x8_t vget_low_s8(int8x16_t __p0) { 11115 int8x8_t __ret; 11116 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11117 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3, 4, 5, 6, 7); 11118 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11119 return __ret; 11120 } 11121 #endif 11122 11123 #ifdef __LITTLE_ENDIAN__ 11124 __ai __attribute__((target("neon"))) float32x2_t vget_low_f32(float32x4_t __p0) { 11125 float32x2_t __ret; 11126 __ret = __builtin_shufflevector(__p0, __p0, 0, 1); 11127 return __ret; 11128 } 11129 #else 11130 __ai __attribute__((target("neon"))) float32x2_t vget_low_f32(float32x4_t __p0) { 11131 float32x2_t __ret; 11132 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11133 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1); 11134 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 11135 return __ret; 11136 } 11137 #endif 11138 11139 #ifdef __LITTLE_ENDIAN__ 11140 __ai __attribute__((target("neon"))) float16x4_t vget_low_f16(float16x8_t __p0) { 11141 float16x4_t __ret; 11142 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3); 11143 return __ret; 11144 } 11145 #else 11146 __ai __attribute__((target("neon"))) float16x4_t vget_low_f16(float16x8_t __p0) { 11147 float16x4_t __ret; 11148 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11149 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3); 11150 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11151 return __ret; 11152 } 11153 #endif 11154 11155 #ifdef __LITTLE_ENDIAN__ 11156 __ai __attribute__((target("neon"))) int32x2_t 
vget_low_s32(int32x4_t __p0) { 11157 int32x2_t __ret; 11158 __ret = __builtin_shufflevector(__p0, __p0, 0, 1); 11159 return __ret; 11160 } 11161 #else 11162 __ai __attribute__((target("neon"))) int32x2_t vget_low_s32(int32x4_t __p0) { 11163 int32x2_t __ret; 11164 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11165 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1); 11166 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 11167 return __ret; 11168 } 11169 #endif 11170 11171 #ifdef __LITTLE_ENDIAN__ 11172 __ai __attribute__((target("neon"))) int64x1_t vget_low_s64(int64x2_t __p0) { 11173 int64x1_t __ret; 11174 __ret = __builtin_shufflevector(__p0, __p0, 0); 11175 return __ret; 11176 } 11177 #else 11178 __ai __attribute__((target("neon"))) int64x1_t vget_low_s64(int64x2_t __p0) { 11179 int64x1_t __ret; 11180 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 11181 __ret = __builtin_shufflevector(__rev0, __rev0, 0); 11182 return __ret; 11183 } 11184 #endif 11185 11186 #ifdef __LITTLE_ENDIAN__ 11187 __ai __attribute__((target("neon"))) int16x4_t vget_low_s16(int16x8_t __p0) { 11188 int16x4_t __ret; 11189 __ret = __builtin_shufflevector(__p0, __p0, 0, 1, 2, 3); 11190 return __ret; 11191 } 11192 #else 11193 __ai __attribute__((target("neon"))) int16x4_t vget_low_s16(int16x8_t __p0) { 11194 int16x4_t __ret; 11195 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11196 __ret = __builtin_shufflevector(__rev0, __rev0, 0, 1, 2, 3); 11197 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11198 return __ret; 11199 } 11200 #endif 11201 11202 #ifdef __LITTLE_ENDIAN__ 11203 __ai __attribute__((target("neon"))) uint8x16_t vhaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 11204 uint8x16_t __ret; 11205 __ret = (uint8x16_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 11206 return __ret; 11207 } 11208 #else 11209 __ai __attribute__((target("neon"))) uint8x16_t 
vhaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 11210 uint8x16_t __ret; 11211 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11212 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11213 __ret = (uint8x16_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 11214 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11215 return __ret; 11216 } 11217 #endif 11218 11219 #ifdef __LITTLE_ENDIAN__ 11220 __ai __attribute__((target("neon"))) uint32x4_t vhaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 11221 uint32x4_t __ret; 11222 __ret = (uint32x4_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 11223 return __ret; 11224 } 11225 #else 11226 __ai __attribute__((target("neon"))) uint32x4_t vhaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 11227 uint32x4_t __ret; 11228 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11229 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 11230 __ret = (uint32x4_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 11231 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11232 return __ret; 11233 } 11234 #endif 11235 11236 #ifdef __LITTLE_ENDIAN__ 11237 __ai __attribute__((target("neon"))) uint16x8_t vhaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 11238 uint16x8_t __ret; 11239 __ret = (uint16x8_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 11240 return __ret; 11241 } 11242 #else 11243 __ai __attribute__((target("neon"))) uint16x8_t vhaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 11244 uint16x8_t __ret; 11245 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11246 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 11247 __ret = (uint16x8_t) 
__builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 11248 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11249 return __ret; 11250 } 11251 #endif 11252 11253 #ifdef __LITTLE_ENDIAN__ 11254 __ai __attribute__((target("neon"))) int8x16_t vhaddq_s8(int8x16_t __p0, int8x16_t __p1) { 11255 int8x16_t __ret; 11256 __ret = (int8x16_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 11257 return __ret; 11258 } 11259 #else 11260 __ai __attribute__((target("neon"))) int8x16_t vhaddq_s8(int8x16_t __p0, int8x16_t __p1) { 11261 int8x16_t __ret; 11262 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11263 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11264 __ret = (int8x16_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 11265 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11266 return __ret; 11267 } 11268 #endif 11269 11270 #ifdef __LITTLE_ENDIAN__ 11271 __ai __attribute__((target("neon"))) int32x4_t vhaddq_s32(int32x4_t __p0, int32x4_t __p1) { 11272 int32x4_t __ret; 11273 __ret = (int32x4_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 11274 return __ret; 11275 } 11276 #else 11277 __ai __attribute__((target("neon"))) int32x4_t vhaddq_s32(int32x4_t __p0, int32x4_t __p1) { 11278 int32x4_t __ret; 11279 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11280 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 11281 __ret = (int32x4_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 11282 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11283 return __ret; 11284 } 11285 #endif 11286 11287 #ifdef __LITTLE_ENDIAN__ 11288 __ai __attribute__((target("neon"))) int16x8_t vhaddq_s16(int16x8_t __p0, int16x8_t __p1) { 11289 
int16x8_t __ret; 11290 __ret = (int16x8_t) __builtin_neon_vhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 11291 return __ret; 11292 } 11293 #else 11294 __ai __attribute__((target("neon"))) int16x8_t vhaddq_s16(int16x8_t __p0, int16x8_t __p1) { 11295 int16x8_t __ret; 11296 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11297 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 11298 __ret = (int16x8_t) __builtin_neon_vhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 11299 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11300 return __ret; 11301 } 11302 #endif 11303 11304 #ifdef __LITTLE_ENDIAN__ 11305 __ai __attribute__((target("neon"))) uint8x8_t vhadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 11306 uint8x8_t __ret; 11307 __ret = (uint8x8_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 11308 return __ret; 11309 } 11310 #else 11311 __ai __attribute__((target("neon"))) uint8x8_t vhadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 11312 uint8x8_t __ret; 11313 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11314 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 11315 __ret = (uint8x8_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 11316 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11317 return __ret; 11318 } 11319 #endif 11320 11321 #ifdef __LITTLE_ENDIAN__ 11322 __ai __attribute__((target("neon"))) uint32x2_t vhadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 11323 uint32x2_t __ret; 11324 __ret = (uint32x2_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 11325 return __ret; 11326 } 11327 #else 11328 __ai __attribute__((target("neon"))) uint32x2_t vhadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 11329 uint32x2_t __ret; 11330 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 11331 uint32x2_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 1, 0); 11332 __ret = (uint32x2_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 11333 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 11334 return __ret; 11335 } 11336 #endif 11337 11338 #ifdef __LITTLE_ENDIAN__ 11339 __ai __attribute__((target("neon"))) uint16x4_t vhadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 11340 uint16x4_t __ret; 11341 __ret = (uint16x4_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 11342 return __ret; 11343 } 11344 #else 11345 __ai __attribute__((target("neon"))) uint16x4_t vhadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 11346 uint16x4_t __ret; 11347 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11348 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 11349 __ret = (uint16x4_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 11350 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11351 return __ret; 11352 } 11353 #endif 11354 11355 #ifdef __LITTLE_ENDIAN__ 11356 __ai __attribute__((target("neon"))) int8x8_t vhadd_s8(int8x8_t __p0, int8x8_t __p1) { 11357 int8x8_t __ret; 11358 __ret = (int8x8_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 11359 return __ret; 11360 } 11361 #else 11362 __ai __attribute__((target("neon"))) int8x8_t vhadd_s8(int8x8_t __p0, int8x8_t __p1) { 11363 int8x8_t __ret; 11364 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11365 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 11366 __ret = (int8x8_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 11367 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11368 return __ret; 11369 } 11370 #endif 11371 11372 #ifdef __LITTLE_ENDIAN__ 11373 __ai __attribute__((target("neon"))) int32x2_t vhadd_s32(int32x2_t __p0, int32x2_t __p1) { 11374 int32x2_t __ret; 11375 __ret = (int32x2_t) 
__builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 11376 return __ret; 11377 } 11378 #else 11379 __ai __attribute__((target("neon"))) int32x2_t vhadd_s32(int32x2_t __p0, int32x2_t __p1) { 11380 int32x2_t __ret; 11381 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 11382 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 11383 __ret = (int32x2_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 11384 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 11385 return __ret; 11386 } 11387 #endif 11388 11389 #ifdef __LITTLE_ENDIAN__ 11390 __ai __attribute__((target("neon"))) int16x4_t vhadd_s16(int16x4_t __p0, int16x4_t __p1) { 11391 int16x4_t __ret; 11392 __ret = (int16x4_t) __builtin_neon_vhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 11393 return __ret; 11394 } 11395 #else 11396 __ai __attribute__((target("neon"))) int16x4_t vhadd_s16(int16x4_t __p0, int16x4_t __p1) { 11397 int16x4_t __ret; 11398 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11399 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 11400 __ret = (int16x4_t) __builtin_neon_vhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 11401 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11402 return __ret; 11403 } 11404 #endif 11405 11406 #ifdef __LITTLE_ENDIAN__ 11407 __ai __attribute__((target("neon"))) uint8x16_t vhsubq_u8(uint8x16_t __p0, uint8x16_t __p1) { 11408 uint8x16_t __ret; 11409 __ret = (uint8x16_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 11410 return __ret; 11411 } 11412 #else 11413 __ai __attribute__((target("neon"))) uint8x16_t vhsubq_u8(uint8x16_t __p0, uint8x16_t __p1) { 11414 uint8x16_t __ret; 11415 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11416 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11417 __ret = 
(uint8x16_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 11418 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11419 return __ret; 11420 } 11421 #endif 11422 11423 #ifdef __LITTLE_ENDIAN__ 11424 __ai __attribute__((target("neon"))) uint32x4_t vhsubq_u32(uint32x4_t __p0, uint32x4_t __p1) { 11425 uint32x4_t __ret; 11426 __ret = (uint32x4_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 11427 return __ret; 11428 } 11429 #else 11430 __ai __attribute__((target("neon"))) uint32x4_t vhsubq_u32(uint32x4_t __p0, uint32x4_t __p1) { 11431 uint32x4_t __ret; 11432 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11433 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 11434 __ret = (uint32x4_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 11435 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11436 return __ret; 11437 } 11438 #endif 11439 11440 #ifdef __LITTLE_ENDIAN__ 11441 __ai __attribute__((target("neon"))) uint16x8_t vhsubq_u16(uint16x8_t __p0, uint16x8_t __p1) { 11442 uint16x8_t __ret; 11443 __ret = (uint16x8_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 11444 return __ret; 11445 } 11446 #else 11447 __ai __attribute__((target("neon"))) uint16x8_t vhsubq_u16(uint16x8_t __p0, uint16x8_t __p1) { 11448 uint16x8_t __ret; 11449 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11450 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 11451 __ret = (uint16x8_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 11452 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11453 return __ret; 11454 } 11455 #endif 11456 11457 #ifdef __LITTLE_ENDIAN__ 11458 __ai __attribute__((target("neon"))) int8x16_t vhsubq_s8(int8x16_t __p0, int8x16_t __p1) { 11459 int8x16_t __ret; 11460 __ret 
= (int8x16_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 11461 return __ret; 11462 } 11463 #else 11464 __ai __attribute__((target("neon"))) int8x16_t vhsubq_s8(int8x16_t __p0, int8x16_t __p1) { 11465 int8x16_t __ret; 11466 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11467 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11468 __ret = (int8x16_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 11469 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 11470 return __ret; 11471 } 11472 #endif 11473 11474 #ifdef __LITTLE_ENDIAN__ 11475 __ai __attribute__((target("neon"))) int32x4_t vhsubq_s32(int32x4_t __p0, int32x4_t __p1) { 11476 int32x4_t __ret; 11477 __ret = (int32x4_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 11478 return __ret; 11479 } 11480 #else 11481 __ai __attribute__((target("neon"))) int32x4_t vhsubq_s32(int32x4_t __p0, int32x4_t __p1) { 11482 int32x4_t __ret; 11483 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11484 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 11485 __ret = (int32x4_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 11486 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11487 return __ret; 11488 } 11489 #endif 11490 11491 #ifdef __LITTLE_ENDIAN__ 11492 __ai __attribute__((target("neon"))) int16x8_t vhsubq_s16(int16x8_t __p0, int16x8_t __p1) { 11493 int16x8_t __ret; 11494 __ret = (int16x8_t) __builtin_neon_vhsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 11495 return __ret; 11496 } 11497 #else 11498 __ai __attribute__((target("neon"))) int16x8_t vhsubq_s16(int16x8_t __p0, int16x8_t __p1) { 11499 int16x8_t __ret; 11500 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 
11501 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 11502 __ret = (int16x8_t) __builtin_neon_vhsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 11503 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11504 return __ret; 11505 } 11506 #endif 11507 11508 #ifdef __LITTLE_ENDIAN__ 11509 __ai __attribute__((target("neon"))) uint8x8_t vhsub_u8(uint8x8_t __p0, uint8x8_t __p1) { 11510 uint8x8_t __ret; 11511 __ret = (uint8x8_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 11512 return __ret; 11513 } 11514 #else 11515 __ai __attribute__((target("neon"))) uint8x8_t vhsub_u8(uint8x8_t __p0, uint8x8_t __p1) { 11516 uint8x8_t __ret; 11517 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11518 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 11519 __ret = (uint8x8_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 11520 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11521 return __ret; 11522 } 11523 #endif 11524 11525 #ifdef __LITTLE_ENDIAN__ 11526 __ai __attribute__((target("neon"))) uint32x2_t vhsub_u32(uint32x2_t __p0, uint32x2_t __p1) { 11527 uint32x2_t __ret; 11528 __ret = (uint32x2_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 11529 return __ret; 11530 } 11531 #else 11532 __ai __attribute__((target("neon"))) uint32x2_t vhsub_u32(uint32x2_t __p0, uint32x2_t __p1) { 11533 uint32x2_t __ret; 11534 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 11535 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 11536 __ret = (uint32x2_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 11537 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 11538 return __ret; 11539 } 11540 #endif 11541 11542 #ifdef __LITTLE_ENDIAN__ 11543 __ai __attribute__((target("neon"))) uint16x4_t vhsub_u16(uint16x4_t __p0, uint16x4_t __p1) { 
11544 uint16x4_t __ret; 11545 __ret = (uint16x4_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 11546 return __ret; 11547 } 11548 #else 11549 __ai __attribute__((target("neon"))) uint16x4_t vhsub_u16(uint16x4_t __p0, uint16x4_t __p1) { 11550 uint16x4_t __ret; 11551 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11552 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 11553 __ret = (uint16x4_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 11554 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11555 return __ret; 11556 } 11557 #endif 11558 11559 #ifdef __LITTLE_ENDIAN__ 11560 __ai __attribute__((target("neon"))) int8x8_t vhsub_s8(int8x8_t __p0, int8x8_t __p1) { 11561 int8x8_t __ret; 11562 __ret = (int8x8_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 11563 return __ret; 11564 } 11565 #else 11566 __ai __attribute__((target("neon"))) int8x8_t vhsub_s8(int8x8_t __p0, int8x8_t __p1) { 11567 int8x8_t __ret; 11568 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 11569 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 11570 __ret = (int8x8_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 11571 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 11572 return __ret; 11573 } 11574 #endif 11575 11576 #ifdef __LITTLE_ENDIAN__ 11577 __ai __attribute__((target("neon"))) int32x2_t vhsub_s32(int32x2_t __p0, int32x2_t __p1) { 11578 int32x2_t __ret; 11579 __ret = (int32x2_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 11580 return __ret; 11581 } 11582 #else 11583 __ai __attribute__((target("neon"))) int32x2_t vhsub_s32(int32x2_t __p0, int32x2_t __p1) { 11584 int32x2_t __ret; 11585 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 11586 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 11587 __ret = 
(int32x2_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 11588 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 11589 return __ret; 11590 } 11591 #endif 11592 11593 #ifdef __LITTLE_ENDIAN__ 11594 __ai __attribute__((target("neon"))) int16x4_t vhsub_s16(int16x4_t __p0, int16x4_t __p1) { 11595 int16x4_t __ret; 11596 __ret = (int16x4_t) __builtin_neon_vhsub_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 11597 return __ret; 11598 } 11599 #else 11600 __ai __attribute__((target("neon"))) int16x4_t vhsub_s16(int16x4_t __p0, int16x4_t __p1) { 11601 int16x4_t __ret; 11602 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 11603 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 11604 __ret = (int16x4_t) __builtin_neon_vhsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 11605 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 11606 return __ret; 11607 } 11608 #endif 11609 11610 #ifdef __LITTLE_ENDIAN__ 11611 #define vld1_p8(__p0) __extension__ ({ \ 11612 poly8x8_t __ret; \ 11613 __ret = (poly8x8_t) __builtin_neon_vld1_v(__p0, 4); \ 11614 __ret; \ 11615 }) 11616 #else 11617 #define vld1_p8(__p0) __extension__ ({ \ 11618 poly8x8_t __ret; \ 11619 __ret = (poly8x8_t) __builtin_neon_vld1_v(__p0, 4); \ 11620 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 11621 __ret; \ 11622 }) 11623 #endif 11624 11625 #ifdef __LITTLE_ENDIAN__ 11626 #define vld1_p16(__p0) __extension__ ({ \ 11627 poly16x4_t __ret; \ 11628 __ret = (poly16x4_t) __builtin_neon_vld1_v(__p0, 5); \ 11629 __ret; \ 11630 }) 11631 #else 11632 #define vld1_p16(__p0) __extension__ ({ \ 11633 poly16x4_t __ret; \ 11634 __ret = (poly16x4_t) __builtin_neon_vld1_v(__p0, 5); \ 11635 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 11636 __ret; \ 11637 }) 11638 #endif 11639 11640 #ifdef __LITTLE_ENDIAN__ 11641 #define vld1q_p8(__p0) __extension__ ({ \ 11642 poly8x16_t __ret; \ 11643 __ret = (poly8x16_t) 
__builtin_neon_vld1q_v(__p0, 36); \ 11644 __ret; \ 11645 }) 11646 #else 11647 #define vld1q_p8(__p0) __extension__ ({ \ 11648 poly8x16_t __ret; \ 11649 __ret = (poly8x16_t) __builtin_neon_vld1q_v(__p0, 36); \ 11650 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 11651 __ret; \ 11652 }) 11653 #endif 11654 11655 #ifdef __LITTLE_ENDIAN__ 11656 #define vld1q_p16(__p0) __extension__ ({ \ 11657 poly16x8_t __ret; \ 11658 __ret = (poly16x8_t) __builtin_neon_vld1q_v(__p0, 37); \ 11659 __ret; \ 11660 }) 11661 #else 11662 #define vld1q_p16(__p0) __extension__ ({ \ 11663 poly16x8_t __ret; \ 11664 __ret = (poly16x8_t) __builtin_neon_vld1q_v(__p0, 37); \ 11665 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 11666 __ret; \ 11667 }) 11668 #endif 11669 11670 #ifdef __LITTLE_ENDIAN__ 11671 #define vld1q_u8(__p0) __extension__ ({ \ 11672 uint8x16_t __ret; \ 11673 __ret = (uint8x16_t) __builtin_neon_vld1q_v(__p0, 48); \ 11674 __ret; \ 11675 }) 11676 #else 11677 #define vld1q_u8(__p0) __extension__ ({ \ 11678 uint8x16_t __ret; \ 11679 __ret = (uint8x16_t) __builtin_neon_vld1q_v(__p0, 48); \ 11680 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 11681 __ret; \ 11682 }) 11683 #endif 11684 11685 #ifdef __LITTLE_ENDIAN__ 11686 #define vld1q_u32(__p0) __extension__ ({ \ 11687 uint32x4_t __ret; \ 11688 __ret = (uint32x4_t) __builtin_neon_vld1q_v(__p0, 50); \ 11689 __ret; \ 11690 }) 11691 #else 11692 #define vld1q_u32(__p0) __extension__ ({ \ 11693 uint32x4_t __ret; \ 11694 __ret = (uint32x4_t) __builtin_neon_vld1q_v(__p0, 50); \ 11695 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 11696 __ret; \ 11697 }) 11698 #endif 11699 11700 #ifdef __LITTLE_ENDIAN__ 11701 #define vld1q_u64(__p0) __extension__ ({ \ 11702 uint64x2_t __ret; \ 11703 __ret = (uint64x2_t) __builtin_neon_vld1q_v(__p0, 51); \ 11704 __ret; \ 11705 }) 11706 #else 11707 #define 
vld1q_u64(__p0) __extension__ ({ \ 11708 uint64x2_t __ret; \ 11709 __ret = (uint64x2_t) __builtin_neon_vld1q_v(__p0, 51); \ 11710 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 11711 __ret; \ 11712 }) 11713 #endif 11714 11715 #ifdef __LITTLE_ENDIAN__ 11716 #define vld1q_u16(__p0) __extension__ ({ \ 11717 uint16x8_t __ret; \ 11718 __ret = (uint16x8_t) __builtin_neon_vld1q_v(__p0, 49); \ 11719 __ret; \ 11720 }) 11721 #else 11722 #define vld1q_u16(__p0) __extension__ ({ \ 11723 uint16x8_t __ret; \ 11724 __ret = (uint16x8_t) __builtin_neon_vld1q_v(__p0, 49); \ 11725 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 11726 __ret; \ 11727 }) 11728 #endif 11729 11730 #ifdef __LITTLE_ENDIAN__ 11731 #define vld1q_s8(__p0) __extension__ ({ \ 11732 int8x16_t __ret; \ 11733 __ret = (int8x16_t) __builtin_neon_vld1q_v(__p0, 32); \ 11734 __ret; \ 11735 }) 11736 #else 11737 #define vld1q_s8(__p0) __extension__ ({ \ 11738 int8x16_t __ret; \ 11739 __ret = (int8x16_t) __builtin_neon_vld1q_v(__p0, 32); \ 11740 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 11741 __ret; \ 11742 }) 11743 #endif 11744 11745 #ifdef __LITTLE_ENDIAN__ 11746 #define vld1q_f32(__p0) __extension__ ({ \ 11747 float32x4_t __ret; \ 11748 __ret = (float32x4_t) __builtin_neon_vld1q_v(__p0, 41); \ 11749 __ret; \ 11750 }) 11751 #else 11752 #define vld1q_f32(__p0) __extension__ ({ \ 11753 float32x4_t __ret; \ 11754 __ret = (float32x4_t) __builtin_neon_vld1q_v(__p0, 41); \ 11755 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 11756 __ret; \ 11757 }) 11758 #endif 11759 11760 #ifdef __LITTLE_ENDIAN__ 11761 #define vld1q_s32(__p0) __extension__ ({ \ 11762 int32x4_t __ret; \ 11763 __ret = (int32x4_t) __builtin_neon_vld1q_v(__p0, 34); \ 11764 __ret; \ 11765 }) 11766 #else 11767 #define vld1q_s32(__p0) __extension__ ({ \ 11768 int32x4_t __ret; \ 11769 __ret = (int32x4_t) __builtin_neon_vld1q_v(__p0, 34); \ 11770 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 11771 __ret; \ 11772 }) 11773 #endif 11774 11775 #ifdef __LITTLE_ENDIAN__ 11776 #define vld1q_s64(__p0) __extension__ ({ \ 11777 int64x2_t __ret; \ 11778 __ret = (int64x2_t) __builtin_neon_vld1q_v(__p0, 35); \ 11779 __ret; \ 11780 }) 11781 #else 11782 #define vld1q_s64(__p0) __extension__ ({ \ 11783 int64x2_t __ret; \ 11784 __ret = (int64x2_t) __builtin_neon_vld1q_v(__p0, 35); \ 11785 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 11786 __ret; \ 11787 }) 11788 #endif 11789 11790 #ifdef __LITTLE_ENDIAN__ 11791 #define vld1q_s16(__p0) __extension__ ({ \ 11792 int16x8_t __ret; \ 11793 __ret = (int16x8_t) __builtin_neon_vld1q_v(__p0, 33); \ 11794 __ret; \ 11795 }) 11796 #else 11797 #define vld1q_s16(__p0) __extension__ ({ \ 11798 int16x8_t __ret; \ 11799 __ret = (int16x8_t) __builtin_neon_vld1q_v(__p0, 33); \ 11800 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 11801 __ret; \ 11802 }) 11803 #endif 11804 11805 #ifdef __LITTLE_ENDIAN__ 11806 #define vld1_u8(__p0) __extension__ ({ \ 11807 uint8x8_t __ret; \ 11808 __ret = (uint8x8_t) __builtin_neon_vld1_v(__p0, 16); \ 11809 __ret; \ 11810 }) 11811 #else 11812 #define vld1_u8(__p0) __extension__ ({ \ 11813 uint8x8_t __ret; \ 11814 __ret = (uint8x8_t) __builtin_neon_vld1_v(__p0, 16); \ 11815 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 11816 __ret; \ 11817 }) 11818 #endif 11819 11820 #ifdef __LITTLE_ENDIAN__ 11821 #define vld1_u32(__p0) __extension__ ({ \ 11822 uint32x2_t __ret; \ 11823 __ret = (uint32x2_t) __builtin_neon_vld1_v(__p0, 18); \ 11824 __ret; \ 11825 }) 11826 #else 11827 #define vld1_u32(__p0) __extension__ ({ \ 11828 uint32x2_t __ret; \ 11829 __ret = (uint32x2_t) __builtin_neon_vld1_v(__p0, 18); \ 11830 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 11831 __ret; \ 11832 }) 11833 #endif 11834 11835 #define vld1_u64(__p0) __extension__ ({ \ 11836 uint64x1_t __ret; \ 11837 __ret = (uint64x1_t) 
__builtin_neon_vld1_v(__p0, 19); \ 11838 __ret; \ 11839 }) 11840 #ifdef __LITTLE_ENDIAN__ 11841 #define vld1_u16(__p0) __extension__ ({ \ 11842 uint16x4_t __ret; \ 11843 __ret = (uint16x4_t) __builtin_neon_vld1_v(__p0, 17); \ 11844 __ret; \ 11845 }) 11846 #else 11847 #define vld1_u16(__p0) __extension__ ({ \ 11848 uint16x4_t __ret; \ 11849 __ret = (uint16x4_t) __builtin_neon_vld1_v(__p0, 17); \ 11850 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 11851 __ret; \ 11852 }) 11853 #endif 11854 11855 #ifdef __LITTLE_ENDIAN__ 11856 #define vld1_s8(__p0) __extension__ ({ \ 11857 int8x8_t __ret; \ 11858 __ret = (int8x8_t) __builtin_neon_vld1_v(__p0, 0); \ 11859 __ret; \ 11860 }) 11861 #else 11862 #define vld1_s8(__p0) __extension__ ({ \ 11863 int8x8_t __ret; \ 11864 __ret = (int8x8_t) __builtin_neon_vld1_v(__p0, 0); \ 11865 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 11866 __ret; \ 11867 }) 11868 #endif 11869 11870 #ifdef __LITTLE_ENDIAN__ 11871 #define vld1_f32(__p0) __extension__ ({ \ 11872 float32x2_t __ret; \ 11873 __ret = (float32x2_t) __builtin_neon_vld1_v(__p0, 9); \ 11874 __ret; \ 11875 }) 11876 #else 11877 #define vld1_f32(__p0) __extension__ ({ \ 11878 float32x2_t __ret; \ 11879 __ret = (float32x2_t) __builtin_neon_vld1_v(__p0, 9); \ 11880 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 11881 __ret; \ 11882 }) 11883 #endif 11884 11885 #ifdef __LITTLE_ENDIAN__ 11886 #define vld1_s32(__p0) __extension__ ({ \ 11887 int32x2_t __ret; \ 11888 __ret = (int32x2_t) __builtin_neon_vld1_v(__p0, 2); \ 11889 __ret; \ 11890 }) 11891 #else 11892 #define vld1_s32(__p0) __extension__ ({ \ 11893 int32x2_t __ret; \ 11894 __ret = (int32x2_t) __builtin_neon_vld1_v(__p0, 2); \ 11895 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 11896 __ret; \ 11897 }) 11898 #endif 11899 11900 #define vld1_s64(__p0) __extension__ ({ \ 11901 int64x1_t __ret; \ 11902 __ret = (int64x1_t) __builtin_neon_vld1_v(__p0, 3); \ 11903 __ret; \ 11904 }) 
#ifdef __LITTLE_ENDIAN__
#define vld1_s16(__p0) __extension__ ({ \
  int16x4_t __ret = (int16x4_t) __builtin_neon_vld1_v(__p0, 1); \
  __ret; \
})
#else
#define vld1_s16(__p0) __extension__ ({ \
  int16x4_t __ret = (int16x4_t) __builtin_neon_vld1_v(__p0, 1); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

/*
 * vld1_dup_* / vld1q_dup_* macros.
 *
 * Each macro hands __p0 and an integer type code to
 * __builtin_neon_vld1_dup_v (or __builtin_neon_vld1q_dup_v for the q forms)
 * and casts the result to the vector type named by the macro suffix.  When
 * __LITTLE_ENDIAN__ is not defined the lanes of the result are reversed.
 * The 64x1 forms have a single definition with no lane reversal.
 */
#ifdef __LITTLE_ENDIAN__
#define vld1_dup_p8(__p0) __extension__ ({ \
  poly8x8_t __ret = (poly8x8_t) __builtin_neon_vld1_dup_v(__p0, 4); \
  __ret; \
})
#else
#define vld1_dup_p8(__p0) __extension__ ({ \
  poly8x8_t __ret = (poly8x8_t) __builtin_neon_vld1_dup_v(__p0, 4); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1_dup_p16(__p0) __extension__ ({ \
  poly16x4_t __ret = (poly16x4_t) __builtin_neon_vld1_dup_v(__p0, 5); \
  __ret; \
})
#else
#define vld1_dup_p16(__p0) __extension__ ({ \
  poly16x4_t __ret = (poly16x4_t) __builtin_neon_vld1_dup_v(__p0, 5); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_p8(__p0) __extension__ ({ \
  poly8x16_t __ret = (poly8x16_t) __builtin_neon_vld1q_dup_v(__p0, 36); \
  __ret; \
})
#else
#define vld1q_dup_p8(__p0) __extension__ ({ \
  poly8x16_t __ret = (poly8x16_t) __builtin_neon_vld1q_dup_v(__p0, 36); \
  __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_p16(__p0) __extension__ ({ \
  poly16x8_t __ret = (poly16x8_t) __builtin_neon_vld1q_dup_v(__p0, 37); \
  __ret; \
})
#else
#define vld1q_dup_p16(__p0) __extension__ ({ \
  poly16x8_t __ret = (poly16x8_t) __builtin_neon_vld1q_dup_v(__p0, 37); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_u8(__p0) __extension__ ({ \
  uint8x16_t __ret = (uint8x16_t) __builtin_neon_vld1q_dup_v(__p0, 48); \
  __ret; \
})
#else
#define vld1q_dup_u8(__p0) __extension__ ({ \
  uint8x16_t __ret = (uint8x16_t) __builtin_neon_vld1q_dup_v(__p0, 48); \
  __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_u32(__p0) __extension__ ({ \
  uint32x4_t __ret = (uint32x4_t) __builtin_neon_vld1q_dup_v(__p0, 50); \
  __ret; \
})
#else
#define vld1q_dup_u32(__p0) __extension__ ({ \
  uint32x4_t __ret = (uint32x4_t) __builtin_neon_vld1q_dup_v(__p0, 50); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_u64(__p0) __extension__ ({ \
  uint64x2_t __ret = (uint64x2_t) __builtin_neon_vld1q_dup_v(__p0, 51); \
  __ret; \
})
#else
#define vld1q_dup_u64(__p0) __extension__ ({ \
  uint64x2_t __ret = (uint64x2_t) __builtin_neon_vld1q_dup_v(__p0, 51); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_u16(__p0) __extension__ ({ \
  uint16x8_t __ret = (uint16x8_t) __builtin_neon_vld1q_dup_v(__p0, 49); \
  __ret; \
})
#else
#define vld1q_dup_u16(__p0) __extension__ ({ \
  uint16x8_t __ret = (uint16x8_t) __builtin_neon_vld1q_dup_v(__p0, 49); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_s8(__p0) __extension__ ({ \
  int8x16_t __ret = (int8x16_t) __builtin_neon_vld1q_dup_v(__p0, 32); \
  __ret; \
})
#else
#define vld1q_dup_s8(__p0) __extension__ ({ \
  int8x16_t __ret = (int8x16_t) __builtin_neon_vld1q_dup_v(__p0, 32); \
  __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_f32(__p0) __extension__ ({ \
  float32x4_t __ret = (float32x4_t) __builtin_neon_vld1q_dup_v(__p0, 41); \
  __ret; \
})
#else
#define vld1q_dup_f32(__p0) __extension__ ({ \
  float32x4_t __ret = (float32x4_t) __builtin_neon_vld1q_dup_v(__p0, 41); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_s32(__p0) __extension__ ({ \
  int32x4_t __ret = (int32x4_t) __builtin_neon_vld1q_dup_v(__p0, 34); \
  __ret; \
})
#else
#define vld1q_dup_s32(__p0) __extension__ ({ \
  int32x4_t __ret = (int32x4_t) __builtin_neon_vld1q_dup_v(__p0, 34); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_s64(__p0) __extension__ ({ \
  int64x2_t __ret = (int64x2_t) __builtin_neon_vld1q_dup_v(__p0, 35); \
  __ret; \
})
#else
#define vld1q_dup_s64(__p0) __extension__ ({ \
  int64x2_t __ret = (int64x2_t) __builtin_neon_vld1q_dup_v(__p0, 35); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_dup_s16(__p0) __extension__ ({ \
  int16x8_t __ret = (int16x8_t) __builtin_neon_vld1q_dup_v(__p0, 33); \
  __ret; \
})
#else
#define vld1q_dup_s16(__p0) __extension__ ({ \
  int16x8_t __ret = (int16x8_t) __builtin_neon_vld1q_dup_v(__p0, 33); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1_dup_u8(__p0) __extension__ ({ \
  uint8x8_t __ret = (uint8x8_t) __builtin_neon_vld1_dup_v(__p0, 16); \
  __ret; \
})
#else
#define vld1_dup_u8(__p0) __extension__ ({ \
  uint8x8_t __ret = (uint8x8_t) __builtin_neon_vld1_dup_v(__p0, 16); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1_dup_u32(__p0) __extension__ ({ \
  uint32x2_t __ret = (uint32x2_t) __builtin_neon_vld1_dup_v(__p0, 18); \
  __ret; \
})
#else
#define vld1_dup_u32(__p0) __extension__ ({ \
  uint32x2_t __ret = (uint32x2_t) __builtin_neon_vld1_dup_v(__p0, 18); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#define vld1_dup_u64(__p0) __extension__ ({ \
  uint64x1_t __ret = (uint64x1_t) __builtin_neon_vld1_dup_v(__p0, 19); \
  __ret; \
})
#ifdef __LITTLE_ENDIAN__
#define vld1_dup_u16(__p0) __extension__ ({ \
  uint16x4_t __ret = (uint16x4_t) __builtin_neon_vld1_dup_v(__p0, 17); \
  __ret; \
})
#else
#define vld1_dup_u16(__p0) __extension__ ({ \
  uint16x4_t __ret = (uint16x4_t) __builtin_neon_vld1_dup_v(__p0, 17); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1_dup_s8(__p0) __extension__ ({ \
  int8x8_t __ret = (int8x8_t) __builtin_neon_vld1_dup_v(__p0, 0); \
  __ret; \
})
#else
#define vld1_dup_s8(__p0) __extension__ ({ \
  int8x8_t __ret = (int8x8_t) __builtin_neon_vld1_dup_v(__p0, 0); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1_dup_f32(__p0) __extension__ ({ \
  float32x2_t __ret = (float32x2_t) __builtin_neon_vld1_dup_v(__p0, 9); \
  __ret; \
})
#else
#define vld1_dup_f32(__p0) __extension__ ({ \
  float32x2_t __ret = (float32x2_t) __builtin_neon_vld1_dup_v(__p0, 9); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1_dup_s32(__p0) __extension__ ({ \
  int32x2_t __ret = (int32x2_t) __builtin_neon_vld1_dup_v(__p0, 2); \
  __ret; \
})
#else
#define vld1_dup_s32(__p0) __extension__ ({ \
  int32x2_t __ret = (int32x2_t) __builtin_neon_vld1_dup_v(__p0, 2); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#define vld1_dup_s64(__p0) __extension__ ({ \
  int64x1_t __ret = (int64x1_t) __builtin_neon_vld1_dup_v(__p0, 3); \
  __ret; \
})
#ifdef __LITTLE_ENDIAN__
#define vld1_dup_s16(__p0) __extension__ ({ \
  int16x4_t __ret = (int16x4_t) __builtin_neon_vld1_dup_v(__p0, 1); \
  __ret; \
})
#else
#define vld1_dup_s16(__p0) __extension__ ({ \
  int16x4_t __ret = (int16x4_t) __builtin_neon_vld1_dup_v(__p0, 1); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

/*
 * vld1_lane_* / vld1q_lane_* macros.
 *
 * __p1 is first copied into a typed local (__s1).  That vector, bit-cast to
 * the int8 vector type the builtin takes, is passed together with __p0, the
 * lane argument __p2 and an integer type code to __builtin_neon_vld1_lane_v
 * (or __builtin_neon_vld1q_lane_v for the q forms).  When __LITTLE_ENDIAN__
 * is not defined, the lanes of __s1 are reversed before the call and the
 * lanes of the result are reversed afterwards.
 */
#ifdef __LITTLE_ENDIAN__
#define vld1_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  poly8x8_t __s1 = __p1; \
  poly8x8_t __ret = (poly8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 4); \
  __ret; \
})
#else
#define vld1_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  poly8x8_t __s1 = __p1; \
  poly8x8_t __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  poly8x8_t __ret = (poly8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 4); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  poly16x4_t __s1 = __p1; \
  poly16x4_t __ret = (poly16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 5); \
  __ret; \
})
#else
#define vld1_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  poly16x4_t __s1 = __p1; \
  poly16x4_t __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  poly16x4_t __ret = (poly16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 5); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  poly8x16_t __s1 = __p1; \
  poly8x16_t __ret = (poly8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 36); \
  __ret; \
})
#else
#define vld1q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  poly8x16_t __s1 = __p1; \
  poly8x16_t __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  poly8x16_t __ret = (poly8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 36); \
  __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  poly16x8_t __s1 = __p1; \
  poly16x8_t __ret = (poly16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 37); \
  __ret; \
})
#else
#define vld1q_lane_p16(__p0, __p1, __p2) __extension__ ({ \
  poly16x8_t __s1 = __p1; \
  poly16x8_t __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  poly16x8_t __ret = (poly16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 37); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  uint8x16_t __s1 = __p1; \
  uint8x16_t __ret = (uint8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 48); \
  __ret; \
})
#else
#define vld1q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  uint8x16_t __s1 = __p1; \
  uint8x16_t __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  uint8x16_t __ret = (uint8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 48); \
  __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  uint32x4_t __s1 = __p1; \
  uint32x4_t __ret = (uint32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 50); \
  __ret; \
})
#else
#define vld1q_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  uint32x4_t __s1 = __p1; \
  uint32x4_t __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \
  uint32x4_t __ret = (uint32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 50); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  uint64x2_t __s1 = __p1; \
  uint64x2_t __ret = (uint64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 51); \
  __ret; \
})
#else
#define vld1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  uint64x2_t __s1 = __p1; \
  uint64x2_t __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  uint64x2_t __ret = (uint64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 51); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vld1q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  uint16x8_t __s1 = __p1; \
  uint16x8_t __ret = (uint16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 49); \
  __ret; \
})
#else
#define vld1q_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  uint16x8_t __s1 = __p1; \
  uint16x8_t __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \
  uint16x8_t __ret = (uint16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 49); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif
12373 12374 #ifdef __LITTLE_ENDIAN__ 12375 #define vld1q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 12376 int8x16_t __ret; \ 12377 int8x16_t __s1 = __p1; \ 12378 __ret = (int8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 32); \ 12379 __ret; \ 12380 }) 12381 #else 12382 #define vld1q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 12383 int8x16_t __ret; \ 12384 int8x16_t __s1 = __p1; \ 12385 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 12386 __ret = (int8x16_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 32); \ 12387 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 12388 __ret; \ 12389 }) 12390 #endif 12391 12392 #ifdef __LITTLE_ENDIAN__ 12393 #define vld1q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 12394 float32x4_t __ret; \ 12395 float32x4_t __s1 = __p1; \ 12396 __ret = (float32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 41); \ 12397 __ret; \ 12398 }) 12399 #else 12400 #define vld1q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 12401 float32x4_t __ret; \ 12402 float32x4_t __s1 = __p1; \ 12403 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 12404 __ret = (float32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 41); \ 12405 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 12406 __ret; \ 12407 }) 12408 #endif 12409 12410 #ifdef __LITTLE_ENDIAN__ 12411 #define vld1q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 12412 int32x4_t __ret; \ 12413 int32x4_t __s1 = __p1; \ 12414 __ret = (int32x4_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 34); \ 12415 __ret; \ 12416 }) 12417 #else 12418 #define vld1q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 12419 int32x4_t __ret; \ 12420 int32x4_t __s1 = __p1; \ 12421 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 12422 __ret = (int32x4_t) 
__builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 34); \ 12423 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 12424 __ret; \ 12425 }) 12426 #endif 12427 12428 #ifdef __LITTLE_ENDIAN__ 12429 #define vld1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 12430 int64x2_t __ret; \ 12431 int64x2_t __s1 = __p1; \ 12432 __ret = (int64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 35); \ 12433 __ret; \ 12434 }) 12435 #else 12436 #define vld1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 12437 int64x2_t __ret; \ 12438 int64x2_t __s1 = __p1; \ 12439 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 12440 __ret = (int64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 35); \ 12441 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 12442 __ret; \ 12443 }) 12444 #endif 12445 12446 #ifdef __LITTLE_ENDIAN__ 12447 #define vld1q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 12448 int16x8_t __ret; \ 12449 int16x8_t __s1 = __p1; \ 12450 __ret = (int16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 33); \ 12451 __ret; \ 12452 }) 12453 #else 12454 #define vld1q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 12455 int16x8_t __ret; \ 12456 int16x8_t __s1 = __p1; \ 12457 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 12458 __ret = (int16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 33); \ 12459 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 12460 __ret; \ 12461 }) 12462 #endif 12463 12464 #ifdef __LITTLE_ENDIAN__ 12465 #define vld1_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 12466 uint8x8_t __ret; \ 12467 uint8x8_t __s1 = __p1; \ 12468 __ret = (uint8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 16); \ 12469 __ret; \ 12470 }) 12471 #else 12472 #define vld1_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 12473 uint8x8_t __ret; \ 12474 uint8x8_t __s1 = __p1; \ 12475 uint8x8_t __rev1; __rev1 = 
__builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 12476 __ret = (uint8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 16); \ 12477 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 12478 __ret; \ 12479 }) 12480 #endif 12481 12482 #ifdef __LITTLE_ENDIAN__ 12483 #define vld1_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 12484 uint32x2_t __ret; \ 12485 uint32x2_t __s1 = __p1; \ 12486 __ret = (uint32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 18); \ 12487 __ret; \ 12488 }) 12489 #else 12490 #define vld1_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 12491 uint32x2_t __ret; \ 12492 uint32x2_t __s1 = __p1; \ 12493 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 12494 __ret = (uint32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 18); \ 12495 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 12496 __ret; \ 12497 }) 12498 #endif 12499 12500 #define vld1_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 12501 uint64x1_t __ret; \ 12502 uint64x1_t __s1 = __p1; \ 12503 __ret = (uint64x1_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 19); \ 12504 __ret; \ 12505 }) 12506 #ifdef __LITTLE_ENDIAN__ 12507 #define vld1_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 12508 uint16x4_t __ret; \ 12509 uint16x4_t __s1 = __p1; \ 12510 __ret = (uint16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 17); \ 12511 __ret; \ 12512 }) 12513 #else 12514 #define vld1_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 12515 uint16x4_t __ret; \ 12516 uint16x4_t __s1 = __p1; \ 12517 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 12518 __ret = (uint16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 17); \ 12519 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 12520 __ret; \ 12521 }) 12522 #endif 12523 12524 #ifdef __LITTLE_ENDIAN__ 12525 #define vld1_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 12526 int8x8_t __ret; \ 12527 
int8x8_t __s1 = __p1; \ 12528 __ret = (int8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 0); \ 12529 __ret; \ 12530 }) 12531 #else 12532 #define vld1_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 12533 int8x8_t __ret; \ 12534 int8x8_t __s1 = __p1; \ 12535 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 12536 __ret = (int8x8_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 0); \ 12537 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 12538 __ret; \ 12539 }) 12540 #endif 12541 12542 /* vld1_lane_f32: passes __p0, the vector __p1 (cast to int8x8_t) and __p2 to __builtin_neon_vld1_lane_v; the #else branch lane-reverses the vector before the call and the result after it. */ #ifdef __LITTLE_ENDIAN__ 12543 #define vld1_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 12544 float32x2_t __ret; \ 12545 float32x2_t __s1 = __p1; \ 12546 __ret = (float32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 9); \ 12547 __ret; \ 12548 }) 12549 #else 12550 #define vld1_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 12551 float32x2_t __ret; \ 12552 float32x2_t __s1 = __p1; \ 12553 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 12554 __ret = (float32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 9); \ 12555 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 12556 __ret; \ 12557 }) 12558 #endif 12559 12560 /* vld1_lane_s32: passes __p0, the vector __p1 (cast to int8x8_t) and __p2 to __builtin_neon_vld1_lane_v; the #else branch lane-reverses the vector before the call and the result after it. */ #ifdef __LITTLE_ENDIAN__ 12561 #define vld1_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 12562 int32x2_t __ret; \ 12563 int32x2_t __s1 = __p1; \ 12564 __ret = (int32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 2); \ 12565 __ret; \ 12566 }) 12567 #else 12568 #define vld1_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 12569 int32x2_t __ret; \ 12570 int32x2_t __s1 = __p1; \ 12571 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 12572 __ret = (int32x2_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 2); \ 12573 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 12574 __ret; \ 12575 }) 12576 #endif 12577 12578 /* vld1_lane_s64: passes __p0, the vector __p1 (cast to int8x8_t) and __p2 to __builtin_neon_vld1_lane_v; single definition, no endian-specific branch. */ #define vld1_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 12579 int64x1_t
__ret; \ 12580 int64x1_t __s1 = __p1; \ 12581 __ret = (int64x1_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 3); \ 12582 __ret; \ 12583 }) 12584 /* vld1_lane_s16: passes __p0, the vector __p1 (cast to int8x8_t) and __p2 to __builtin_neon_vld1_lane_v; the #else branch lane-reverses the vector before the call and the result after it. */ #ifdef __LITTLE_ENDIAN__ 12585 #define vld1_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 12586 int16x4_t __ret; \ 12587 int16x4_t __s1 = __p1; \ 12588 __ret = (int16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 1); \ 12589 __ret; \ 12590 }) 12591 #else 12592 #define vld1_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 12593 int16x4_t __ret; \ 12594 int16x4_t __s1 = __p1; \ 12595 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 12596 __ret = (int16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 1); \ 12597 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 12598 __ret; \ 12599 }) 12600 #endif 12601 12602 /* vld1_p8_x2: declares a poly8x8x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12603 #define vld1_p8_x2(__p0) __extension__ ({ \ 12604 poly8x8x2_t __ret; \ 12605 __builtin_neon_vld1_x2_v(&__ret, __p0, 4); \ 12606 __ret; \ 12607 }) 12608 #else 12609 #define vld1_p8_x2(__p0) __extension__ ({ \ 12610 poly8x8x2_t __ret; \ 12611 __builtin_neon_vld1_x2_v(&__ret, __p0, 4); \ 12612 \ 12613 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 12614 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 12615 __ret; \ 12616 }) 12617 #endif 12618 12619 /* vld1_p16_x2: declares a poly16x4x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12620 #define vld1_p16_x2(__p0) __extension__ ({ \ 12621 poly16x4x2_t __ret; \ 12622 __builtin_neon_vld1_x2_v(&__ret, __p0, 5); \ 12623 __ret; \ 12624 }) 12625 #else 12626 #define vld1_p16_x2(__p0) __extension__ ({ \ 12627 poly16x4x2_t __ret; \ 12628 __builtin_neon_vld1_x2_v(&__ret, __p0, 5); \ 12629 \ 12630 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 12631 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 12632 __ret; \ 12633 }) 12634 #endif 12635 12636 /* vld1q_p8_x2: declares a poly8x16x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12637
#define vld1q_p8_x2(__p0) __extension__ ({ \ 12638 poly8x16x2_t __ret; \ 12639 __builtin_neon_vld1q_x2_v(&__ret, __p0, 36); \ 12640 __ret; \ 12641 }) 12642 #else 12643 #define vld1q_p8_x2(__p0) __extension__ ({ \ 12644 poly8x16x2_t __ret; \ 12645 __builtin_neon_vld1q_x2_v(&__ret, __p0, 36); \ 12646 \ 12647 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 12648 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 12649 __ret; \ 12650 }) 12651 #endif 12652 12653 /* vld1q_p16_x2: declares a poly16x8x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12654 #define vld1q_p16_x2(__p0) __extension__ ({ \ 12655 poly16x8x2_t __ret; \ 12656 __builtin_neon_vld1q_x2_v(&__ret, __p0, 37); \ 12657 __ret; \ 12658 }) 12659 #else 12660 #define vld1q_p16_x2(__p0) __extension__ ({ \ 12661 poly16x8x2_t __ret; \ 12662 __builtin_neon_vld1q_x2_v(&__ret, __p0, 37); \ 12663 \ 12664 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 12665 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 12666 __ret; \ 12667 }) 12668 #endif 12669 12670 /* vld1q_u8_x2: declares a uint8x16x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12671 #define vld1q_u8_x2(__p0) __extension__ ({ \ 12672 uint8x16x2_t __ret; \ 12673 __builtin_neon_vld1q_x2_v(&__ret, __p0, 48); \ 12674 __ret; \ 12675 }) 12676 #else 12677 #define vld1q_u8_x2(__p0) __extension__ ({ \ 12678 uint8x16x2_t __ret; \ 12679 __builtin_neon_vld1q_x2_v(&__ret, __p0, 48); \ 12680 \ 12681 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 12682 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 12683 __ret; \ 12684 }) 12685 #endif 12686 12687 /* vld1q_u32_x2: declares a uint32x4x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12688 #define vld1q_u32_x2(__p0) __extension__ ({ \ 12689 uint32x4x2_t __ret; \ 12690 __builtin_neon_vld1q_x2_v(&__ret, __p0, 50); \
12691 __ret; \ 12692 }) 12693 #else 12694 #define vld1q_u32_x2(__p0) __extension__ ({ \ 12695 uint32x4x2_t __ret; \ 12696 __builtin_neon_vld1q_x2_v(&__ret, __p0, 50); \ 12697 \ 12698 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 12699 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 12700 __ret; \ 12701 }) 12702 #endif 12703 12704 /* vld1q_u64_x2: declares a uint64x2x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12705 #define vld1q_u64_x2(__p0) __extension__ ({ \ 12706 uint64x2x2_t __ret; \ 12707 __builtin_neon_vld1q_x2_v(&__ret, __p0, 51); \ 12708 __ret; \ 12709 }) 12710 #else 12711 #define vld1q_u64_x2(__p0) __extension__ ({ \ 12712 uint64x2x2_t __ret; \ 12713 __builtin_neon_vld1q_x2_v(&__ret, __p0, 51); \ 12714 \ 12715 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 12716 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 12717 __ret; \ 12718 }) 12719 #endif 12720 12721 /* vld1q_u16_x2: declares a uint16x8x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12722 #define vld1q_u16_x2(__p0) __extension__ ({ \ 12723 uint16x8x2_t __ret; \ 12724 __builtin_neon_vld1q_x2_v(&__ret, __p0, 49); \ 12725 __ret; \ 12726 }) 12727 #else 12728 #define vld1q_u16_x2(__p0) __extension__ ({ \ 12729 uint16x8x2_t __ret; \ 12730 __builtin_neon_vld1q_x2_v(&__ret, __p0, 49); \ 12731 \ 12732 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 12733 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 12734 __ret; \ 12735 }) 12736 #endif 12737 12738 /* vld1q_s8_x2: declares an int8x16x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12739 #define vld1q_s8_x2(__p0) __extension__ ({ \ 12740 int8x16x2_t __ret; \ 12741 __builtin_neon_vld1q_x2_v(&__ret, __p0, 32); \ 12742 __ret; \ 12743 }) 12744 #else 12745 #define vld1q_s8_x2(__p0) __extension__ ({ \ 12746 int8x16x2_t __ret; \ 12747 __builtin_neon_vld1q_x2_v(&__ret, __p0, 32); \ 12748 \ 12749 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
12750 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 12751 __ret; \ 12752 }) 12753 #endif 12754 12755 /* vld1q_f32_x2: declares a float32x4x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12756 #define vld1q_f32_x2(__p0) __extension__ ({ \ 12757 float32x4x2_t __ret; \ 12758 __builtin_neon_vld1q_x2_v(&__ret, __p0, 41); \ 12759 __ret; \ 12760 }) 12761 #else 12762 #define vld1q_f32_x2(__p0) __extension__ ({ \ 12763 float32x4x2_t __ret; \ 12764 __builtin_neon_vld1q_x2_v(&__ret, __p0, 41); \ 12765 \ 12766 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 12767 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 12768 __ret; \ 12769 }) 12770 #endif 12771 12772 /* vld1q_s32_x2: declares an int32x4x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12773 #define vld1q_s32_x2(__p0) __extension__ ({ \ 12774 int32x4x2_t __ret; \ 12775 __builtin_neon_vld1q_x2_v(&__ret, __p0, 34); \ 12776 __ret; \ 12777 }) 12778 #else 12779 #define vld1q_s32_x2(__p0) __extension__ ({ \ 12780 int32x4x2_t __ret; \ 12781 __builtin_neon_vld1q_x2_v(&__ret, __p0, 34); \ 12782 \ 12783 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 12784 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 12785 __ret; \ 12786 }) 12787 #endif 12788 12789 /* vld1q_s64_x2: declares an int64x2x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12790 #define vld1q_s64_x2(__p0) __extension__ ({ \ 12791 int64x2x2_t __ret; \ 12792 __builtin_neon_vld1q_x2_v(&__ret, __p0, 35); \ 12793 __ret; \ 12794 }) 12795 #else 12796 #define vld1q_s64_x2(__p0) __extension__ ({ \ 12797 int64x2x2_t __ret; \ 12798 __builtin_neon_vld1q_x2_v(&__ret, __p0, 35); \ 12799 \ 12800 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 12801 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 12802 __ret; \ 12803 }) 12804 #endif 12805 12806 /* vld1q_s16_x2: declares an int16x8x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12807 #define vld1q_s16_x2(__p0) __extension__ ({ \ 12808 int16x8x2_t __ret; \ 12809 __builtin_neon_vld1q_x2_v(&__ret, __p0, 33);
\ 12810 __ret; \ 12811 }) 12812 #else 12813 #define vld1q_s16_x2(__p0) __extension__ ({ \ 12814 int16x8x2_t __ret; \ 12815 __builtin_neon_vld1q_x2_v(&__ret, __p0, 33); \ 12816 \ 12817 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 12818 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 12819 __ret; \ 12820 }) 12821 #endif 12822 12823 /* vld1_u8_x2: declares a uint8x8x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12824 #define vld1_u8_x2(__p0) __extension__ ({ \ 12825 uint8x8x2_t __ret; \ 12826 __builtin_neon_vld1_x2_v(&__ret, __p0, 16); \ 12827 __ret; \ 12828 }) 12829 #else 12830 #define vld1_u8_x2(__p0) __extension__ ({ \ 12831 uint8x8x2_t __ret; \ 12832 __builtin_neon_vld1_x2_v(&__ret, __p0, 16); \ 12833 \ 12834 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 12835 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 12836 __ret; \ 12837 }) 12838 #endif 12839 12840 /* vld1_u32_x2: declares a uint32x2x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12841 #define vld1_u32_x2(__p0) __extension__ ({ \ 12842 uint32x2x2_t __ret; \ 12843 __builtin_neon_vld1_x2_v(&__ret, __p0, 18); \ 12844 __ret; \ 12845 }) 12846 #else 12847 #define vld1_u32_x2(__p0) __extension__ ({ \ 12848 uint32x2x2_t __ret; \ 12849 __builtin_neon_vld1_x2_v(&__ret, __p0, 18); \ 12850 \ 12851 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 12852 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 12853 __ret; \ 12854 }) 12855 #endif 12856 12857 /* vld1_u64_x2: declares a uint64x1x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; single definition, no endian-specific branch. */ #define vld1_u64_x2(__p0) __extension__ ({ \ 12858 uint64x1x2_t __ret; \ 12859 __builtin_neon_vld1_x2_v(&__ret, __p0, 19); \ 12860 __ret; \ 12861 }) 12862 /* vld1_u16_x2: declares a uint16x4x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12863 #define vld1_u16_x2(__p0) __extension__ ({ \ 12864 uint16x4x2_t __ret; \ 12865 __builtin_neon_vld1_x2_v(&__ret, __p0, 17); \ 12866 __ret; \ 12867 }) 12868 #else 12869 #define vld1_u16_x2(__p0) __extension__ ({ \ 12870 uint16x4x2_t __ret; \ 12871
__builtin_neon_vld1_x2_v(&__ret, __p0, 17); \ 12872 \ 12873 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 12874 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 12875 __ret; \ 12876 }) 12877 #endif 12878 12879 /* vld1_s8_x2: declares an int8x8x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12880 #define vld1_s8_x2(__p0) __extension__ ({ \ 12881 int8x8x2_t __ret; \ 12882 __builtin_neon_vld1_x2_v(&__ret, __p0, 0); \ 12883 __ret; \ 12884 }) 12885 #else 12886 #define vld1_s8_x2(__p0) __extension__ ({ \ 12887 int8x8x2_t __ret; \ 12888 __builtin_neon_vld1_x2_v(&__ret, __p0, 0); \ 12889 \ 12890 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 12891 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 12892 __ret; \ 12893 }) 12894 #endif 12895 12896 /* vld1_f32_x2: declares a float32x2x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12897 #define vld1_f32_x2(__p0) __extension__ ({ \ 12898 float32x2x2_t __ret; \ 12899 __builtin_neon_vld1_x2_v(&__ret, __p0, 9); \ 12900 __ret; \ 12901 }) 12902 #else 12903 #define vld1_f32_x2(__p0) __extension__ ({ \ 12904 float32x2x2_t __ret; \ 12905 __builtin_neon_vld1_x2_v(&__ret, __p0, 9); \ 12906 \ 12907 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 12908 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 12909 __ret; \ 12910 }) 12911 #endif 12912 12913 /* vld1_s32_x2: declares an int32x2x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12914 #define vld1_s32_x2(__p0) __extension__ ({ \ 12915 int32x2x2_t __ret; \ 12916 __builtin_neon_vld1_x2_v(&__ret, __p0, 2); \ 12917 __ret; \ 12918 }) 12919 #else 12920 #define vld1_s32_x2(__p0) __extension__ ({ \ 12921 int32x2x2_t __ret; \ 12922 __builtin_neon_vld1_x2_v(&__ret, __p0, 2); \ 12923 \ 12924 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 12925 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 12926 __ret; \ 12927 }) 12928 #endif 12929 12930 /* vld1_s64_x2: declares an int64x1x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; single definition, no endian-specific branch. */ #define vld1_s64_x2(__p0) __extension__ ({ \ 12931 int64x1x2_t
__ret; \ 12932 __builtin_neon_vld1_x2_v(&__ret, __p0, 3); \ 12933 __ret; \ 12934 }) 12935 /* vld1_s16_x2: declares an int16x4x2_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x2_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12936 #define vld1_s16_x2(__p0) __extension__ ({ \ 12937 int16x4x2_t __ret; \ 12938 __builtin_neon_vld1_x2_v(&__ret, __p0, 1); \ 12939 __ret; \ 12940 }) 12941 #else 12942 #define vld1_s16_x2(__p0) __extension__ ({ \ 12943 int16x4x2_t __ret; \ 12944 __builtin_neon_vld1_x2_v(&__ret, __p0, 1); \ 12945 \ 12946 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 12947 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 12948 __ret; \ 12949 }) 12950 #endif 12951 12952 /* vld1_p8_x3: declares a poly8x8x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12953 #define vld1_p8_x3(__p0) __extension__ ({ \ 12954 poly8x8x3_t __ret; \ 12955 __builtin_neon_vld1_x3_v(&__ret, __p0, 4); \ 12956 __ret; \ 12957 }) 12958 #else 12959 #define vld1_p8_x3(__p0) __extension__ ({ \ 12960 poly8x8x3_t __ret; \ 12961 __builtin_neon_vld1_x3_v(&__ret, __p0, 4); \ 12962 \ 12963 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 12964 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 12965 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 12966 __ret; \ 12967 }) 12968 #endif 12969 12970 /* vld1_p16_x3: declares a poly16x4x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12971 #define vld1_p16_x3(__p0) __extension__ ({ \ 12972 poly16x4x3_t __ret; \ 12973 __builtin_neon_vld1_x3_v(&__ret, __p0, 5); \ 12974 __ret; \ 12975 }) 12976 #else 12977 #define vld1_p16_x3(__p0) __extension__ ({ \ 12978 poly16x4x3_t __ret; \ 12979 __builtin_neon_vld1_x3_v(&__ret, __p0, 5); \ 12980 \ 12981 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 12982 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 12983 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 12984 __ret; \ 12985 }) 12986 #endif 12987 12988 /* vld1q_p8_x3: declares a poly8x16x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 12989 #define
vld1q_p8_x3(__p0) __extension__ ({ \ 12990 poly8x16x3_t __ret; \ 12991 __builtin_neon_vld1q_x3_v(&__ret, __p0, 36); \ 12992 __ret; \ 12993 }) 12994 #else 12995 #define vld1q_p8_x3(__p0) __extension__ ({ \ 12996 poly8x16x3_t __ret; \ 12997 __builtin_neon_vld1q_x3_v(&__ret, __p0, 36); \ 12998 \ 12999 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13000 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13001 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13002 __ret; \ 13003 }) 13004 #endif 13005 13006 /* vld1q_p16_x3: declares a poly16x8x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13007 #define vld1q_p16_x3(__p0) __extension__ ({ \ 13008 poly16x8x3_t __ret; \ 13009 __builtin_neon_vld1q_x3_v(&__ret, __p0, 37); \ 13010 __ret; \ 13011 }) 13012 #else 13013 #define vld1q_p16_x3(__p0) __extension__ ({ \ 13014 poly16x8x3_t __ret; \ 13015 __builtin_neon_vld1q_x3_v(&__ret, __p0, 37); \ 13016 \ 13017 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13018 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13019 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13020 __ret; \ 13021 }) 13022 #endif 13023 13024 /* vld1q_u8_x3: declares a uint8x16x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13025 #define vld1q_u8_x3(__p0) __extension__ ({ \ 13026 uint8x16x3_t __ret; \ 13027 __builtin_neon_vld1q_x3_v(&__ret, __p0, 48); \ 13028 __ret; \ 13029 }) 13030 #else 13031 #define vld1q_u8_x3(__p0) __extension__ ({ \ 13032 uint8x16x3_t __ret; \ 13033 __builtin_neon_vld1q_x3_v(&__ret, __p0, 48); \ 13034 \ 13035 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13036 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3,
2, 1, 0); \ 13037 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13038 __ret; \ 13039 }) 13040 #endif 13041 13042 /* vld1q_u32_x3: declares a uint32x4x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13043 #define vld1q_u32_x3(__p0) __extension__ ({ \ 13044 uint32x4x3_t __ret; \ 13045 __builtin_neon_vld1q_x3_v(&__ret, __p0, 50); \ 13046 __ret; \ 13047 }) 13048 #else 13049 #define vld1q_u32_x3(__p0) __extension__ ({ \ 13050 uint32x4x3_t __ret; \ 13051 __builtin_neon_vld1q_x3_v(&__ret, __p0, 50); \ 13052 \ 13053 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13054 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13055 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13056 __ret; \ 13057 }) 13058 #endif 13059 13060 /* vld1q_u64_x3: declares a uint64x2x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13061 #define vld1q_u64_x3(__p0) __extension__ ({ \ 13062 uint64x2x3_t __ret; \ 13063 __builtin_neon_vld1q_x3_v(&__ret, __p0, 51); \ 13064 __ret; \ 13065 }) 13066 #else 13067 #define vld1q_u64_x3(__p0) __extension__ ({ \ 13068 uint64x2x3_t __ret; \ 13069 __builtin_neon_vld1q_x3_v(&__ret, __p0, 51); \ 13070 \ 13071 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13072 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13073 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13074 __ret; \ 13075 }) 13076 #endif 13077 13078 /* vld1q_u16_x3: declares a uint16x8x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13079 #define vld1q_u16_x3(__p0) __extension__ ({ \ 13080 uint16x8x3_t __ret; \ 13081 __builtin_neon_vld1q_x3_v(&__ret, __p0, 49); \ 13082 __ret; \ 13083 }) 13084 #else 13085 #define vld1q_u16_x3(__p0) __extension__ ({ \ 13086 uint16x8x3_t __ret; \ 13087 __builtin_neon_vld1q_x3_v(&__ret, __p0, 49); \ 13088 \ 13089 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13090 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1,
0); \ 13091 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13092 __ret; \ 13093 }) 13094 #endif 13095 13096 /* vld1q_s8_x3: declares an int8x16x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13097 #define vld1q_s8_x3(__p0) __extension__ ({ \ 13098 int8x16x3_t __ret; \ 13099 __builtin_neon_vld1q_x3_v(&__ret, __p0, 32); \ 13100 __ret; \ 13101 }) 13102 #else 13103 #define vld1q_s8_x3(__p0) __extension__ ({ \ 13104 int8x16x3_t __ret; \ 13105 __builtin_neon_vld1q_x3_v(&__ret, __p0, 32); \ 13106 \ 13107 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13108 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13109 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13110 __ret; \ 13111 }) 13112 #endif 13113 13114 /* vld1q_f32_x3: declares a float32x4x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13115 #define vld1q_f32_x3(__p0) __extension__ ({ \ 13116 float32x4x3_t __ret; \ 13117 __builtin_neon_vld1q_x3_v(&__ret, __p0, 41); \ 13118 __ret; \ 13119 }) 13120 #else 13121 #define vld1q_f32_x3(__p0) __extension__ ({ \ 13122 float32x4x3_t __ret; \ 13123 __builtin_neon_vld1q_x3_v(&__ret, __p0, 41); \ 13124 \ 13125 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13126 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13127 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13128 __ret; \ 13129 }) 13130 #endif 13131 13132 /* vld1q_s32_x3: declares an int32x4x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13133 #define vld1q_s32_x3(__p0) __extension__ ({ \ 13134 int32x4x3_t __ret; \ 13135 __builtin_neon_vld1q_x3_v(&__ret, __p0, 34); \ 13136 __ret; \ 13137 }) 13138 #else 13139 #define vld1q_s32_x3(__p0) __extension__ ({ \ 13140 int32x4x3_t __ret; \ 13141 __builtin_neon_vld1q_x3_v(&__ret, __p0, 34); \ 13142 \ 13143 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
13144 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13145 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13146 __ret; \ 13147 }) 13148 #endif 13149 13150 /* vld1q_s64_x3: declares an int64x2x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13151 #define vld1q_s64_x3(__p0) __extension__ ({ \ 13152 int64x2x3_t __ret; \ 13153 __builtin_neon_vld1q_x3_v(&__ret, __p0, 35); \ 13154 __ret; \ 13155 }) 13156 #else 13157 #define vld1q_s64_x3(__p0) __extension__ ({ \ 13158 int64x2x3_t __ret; \ 13159 __builtin_neon_vld1q_x3_v(&__ret, __p0, 35); \ 13160 \ 13161 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13162 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13163 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13164 __ret; \ 13165 }) 13166 #endif 13167 13168 /* vld1q_s16_x3: declares an int16x8x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13169 #define vld1q_s16_x3(__p0) __extension__ ({ \ 13170 int16x8x3_t __ret; \ 13171 __builtin_neon_vld1q_x3_v(&__ret, __p0, 33); \ 13172 __ret; \ 13173 }) 13174 #else 13175 #define vld1q_s16_x3(__p0) __extension__ ({ \ 13176 int16x8x3_t __ret; \ 13177 __builtin_neon_vld1q_x3_v(&__ret, __p0, 33); \ 13178 \ 13179 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13180 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13181 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13182 __ret; \ 13183 }) 13184 #endif 13185 13186 /* vld1_u8_x3: declares a uint8x8x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13187 #define vld1_u8_x3(__p0) __extension__ ({ \ 13188 uint8x8x3_t __ret; \ 13189 __builtin_neon_vld1_x3_v(&__ret, __p0, 16); \ 13190 __ret; \ 13191 }) 13192 #else 13193 #define vld1_u8_x3(__p0) __extension__ ({ \ 13194 uint8x8x3_t __ret; \ 13195 __builtin_neon_vld1_x3_v(&__ret, __p0, 16); \ 13196 \ 13197 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13198 __ret.val[1] =
__builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13199 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13200 __ret; \ 13201 }) 13202 #endif 13203 13204 /* vld1_u32_x3: declares a uint32x2x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13205 #define vld1_u32_x3(__p0) __extension__ ({ \ 13206 uint32x2x3_t __ret; \ 13207 __builtin_neon_vld1_x3_v(&__ret, __p0, 18); \ 13208 __ret; \ 13209 }) 13210 #else 13211 #define vld1_u32_x3(__p0) __extension__ ({ \ 13212 uint32x2x3_t __ret; \ 13213 __builtin_neon_vld1_x3_v(&__ret, __p0, 18); \ 13214 \ 13215 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13216 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13217 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13218 __ret; \ 13219 }) 13220 #endif 13221 13222 /* vld1_u64_x3: declares a uint64x1x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; single definition, no endian-specific branch. */ #define vld1_u64_x3(__p0) __extension__ ({ \ 13223 uint64x1x3_t __ret; \ 13224 __builtin_neon_vld1_x3_v(&__ret, __p0, 19); \ 13225 __ret; \ 13226 }) 13227 /* vld1_u16_x3: declares a uint16x4x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13228 #define vld1_u16_x3(__p0) __extension__ ({ \ 13229 uint16x4x3_t __ret; \ 13230 __builtin_neon_vld1_x3_v(&__ret, __p0, 17); \ 13231 __ret; \ 13232 }) 13233 #else 13234 #define vld1_u16_x3(__p0) __extension__ ({ \ 13235 uint16x4x3_t __ret; \ 13236 __builtin_neon_vld1_x3_v(&__ret, __p0, 17); \ 13237 \ 13238 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13239 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13240 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13241 __ret; \ 13242 }) 13243 #endif 13244 13245 /* vld1_s8_x3: declares an int8x8x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13246 #define vld1_s8_x3(__p0) __extension__ ({ \ 13247 int8x8x3_t __ret; \ 13248 __builtin_neon_vld1_x3_v(&__ret, __p0, 0); \ 13249 __ret; \ 13250 }) 13251 #else 13252 #define vld1_s8_x3(__p0) __extension__ ({ \ 13253 int8x8x3_t __ret; \ 13254 __builtin_neon_vld1_x3_v(&__ret, __p0, 0); \ 13255 \ 13256 __ret.val[0] =
__builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13257 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13258 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13259 __ret; \ 13260 }) 13261 #endif 13262 13263 /* vld1_f32_x3: declares a float32x2x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13264 #define vld1_f32_x3(__p0) __extension__ ({ \ 13265 float32x2x3_t __ret; \ 13266 __builtin_neon_vld1_x3_v(&__ret, __p0, 9); \ 13267 __ret; \ 13268 }) 13269 #else 13270 #define vld1_f32_x3(__p0) __extension__ ({ \ 13271 float32x2x3_t __ret; \ 13272 __builtin_neon_vld1_x3_v(&__ret, __p0, 9); \ 13273 \ 13274 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13275 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13276 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13277 __ret; \ 13278 }) 13279 #endif 13280 13281 /* vld1_s32_x3: declares an int32x2x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13282 #define vld1_s32_x3(__p0) __extension__ ({ \ 13283 int32x2x3_t __ret; \ 13284 __builtin_neon_vld1_x3_v(&__ret, __p0, 2); \ 13285 __ret; \ 13286 }) 13287 #else 13288 #define vld1_s32_x3(__p0) __extension__ ({ \ 13289 int32x2x3_t __ret; \ 13290 __builtin_neon_vld1_x3_v(&__ret, __p0, 2); \ 13291 \ 13292 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13293 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13294 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13295 __ret; \ 13296 }) 13297 #endif 13298 13299 /* vld1_s64_x3: declares an int64x1x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; single definition, no endian-specific branch. */ #define vld1_s64_x3(__p0) __extension__ ({ \ 13300 int64x1x3_t __ret; \ 13301 __builtin_neon_vld1_x3_v(&__ret, __p0, 3); \ 13302 __ret; \ 13303 }) 13304 /* vld1_s16_x3: declares an int16x4x3_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x3_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13305 #define vld1_s16_x3(__p0) __extension__ ({ \ 13306 int16x4x3_t __ret; \ 13307 __builtin_neon_vld1_x3_v(&__ret, __p0, 1); \ 13308 __ret; \ 13309 }) 13310 #else 13311 #define vld1_s16_x3(__p0) __extension__ ({ \ 13312 int16x4x3_t __ret; \
13313 __builtin_neon_vld1_x3_v(&__ret, __p0, 1); \ 13314 \ 13315 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13316 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13317 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13318 __ret; \ 13319 }) 13320 #endif 13321 13322 /* vld1_p8_x4: declares a poly8x8x4_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x4_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13323 #define vld1_p8_x4(__p0) __extension__ ({ \ 13324 poly8x8x4_t __ret; \ 13325 __builtin_neon_vld1_x4_v(&__ret, __p0, 4); \ 13326 __ret; \ 13327 }) 13328 #else 13329 #define vld1_p8_x4(__p0) __extension__ ({ \ 13330 poly8x8x4_t __ret; \ 13331 __builtin_neon_vld1_x4_v(&__ret, __p0, 4); \ 13332 \ 13333 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13334 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13335 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13336 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 13337 __ret; \ 13338 }) 13339 #endif 13340 13341 /* vld1_p16_x4: declares a poly16x4x4_t __ret, passes &__ret and __p0 to __builtin_neon_vld1_x4_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13342 #define vld1_p16_x4(__p0) __extension__ ({ \ 13343 poly16x4x4_t __ret; \ 13344 __builtin_neon_vld1_x4_v(&__ret, __p0, 5); \ 13345 __ret; \ 13346 }) 13347 #else 13348 #define vld1_p16_x4(__p0) __extension__ ({ \ 13349 poly16x4x4_t __ret; \ 13350 __builtin_neon_vld1_x4_v(&__ret, __p0, 5); \ 13351 \ 13352 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13353 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13354 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13355 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 13356 __ret; \ 13357 }) 13358 #endif 13359 13360 /* vld1q_p8_x4: declares a poly8x16x4_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x4_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13361 #define vld1q_p8_x4(__p0) __extension__ ({ \ 13362 poly8x16x4_t __ret; \ 13363
__builtin_neon_vld1q_x4_v(&__ret, __p0, 36); \ 13364 __ret; \ 13365 }) 13366 #else 13367 #define vld1q_p8_x4(__p0) __extension__ ({ \ 13368 poly8x16x4_t __ret; \ 13369 __builtin_neon_vld1q_x4_v(&__ret, __p0, 36); \ 13370 \ 13371 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13372 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13373 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13374 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13375 __ret; \ 13376 }) 13377 #endif 13378 13379 /* vld1q_p16_x4: declares a poly16x8x4_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x4_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13380 #define vld1q_p16_x4(__p0) __extension__ ({ \ 13381 poly16x8x4_t __ret; \ 13382 __builtin_neon_vld1q_x4_v(&__ret, __p0, 37); \ 13383 __ret; \ 13384 }) 13385 #else 13386 #define vld1q_p16_x4(__p0) __extension__ ({ \ 13387 poly16x8x4_t __ret; \ 13388 __builtin_neon_vld1q_x4_v(&__ret, __p0, 37); \ 13389 \ 13390 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13391 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13392 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13393 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 13394 __ret; \ 13395 }) 13396 #endif 13397 13398 /* vld1q_u8_x4: declares a uint8x16x4_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x4_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13399 #define vld1q_u8_x4(__p0) __extension__ ({ \ 13400 uint8x16x4_t __ret; \ 13401 __builtin_neon_vld1q_x4_v(&__ret, __p0, 48); \ 13402 __ret; \ 13403 }) 13404 #else 13405 #define vld1q_u8_x4(__p0) __extension__ ({ \ 13406 uint8x16x4_t __ret; \ 13407 __builtin_neon_vld1q_x4_v(&__ret, __p0, 48); \ 13408 \ 13409 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12,
11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13410 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13411 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13412 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13413 __ret; \ 13414 }) 13415 #endif 13416 13417 /* vld1q_u32_x4: declares a uint32x4x4_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x4_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13418 #define vld1q_u32_x4(__p0) __extension__ ({ \ 13419 uint32x4x4_t __ret; \ 13420 __builtin_neon_vld1q_x4_v(&__ret, __p0, 50); \ 13421 __ret; \ 13422 }) 13423 #else 13424 #define vld1q_u32_x4(__p0) __extension__ ({ \ 13425 uint32x4x4_t __ret; \ 13426 __builtin_neon_vld1q_x4_v(&__ret, __p0, 50); \ 13427 \ 13428 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13429 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13430 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13431 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 13432 __ret; \ 13433 }) 13434 #endif 13435 13436 /* vld1q_u64_x4: declares a uint64x2x4_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x4_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13437 #define vld1q_u64_x4(__p0) __extension__ ({ \ 13438 uint64x2x4_t __ret; \ 13439 __builtin_neon_vld1q_x4_v(&__ret, __p0, 51); \ 13440 __ret; \ 13441 }) 13442 #else 13443 #define vld1q_u64_x4(__p0) __extension__ ({ \ 13444 uint64x2x4_t __ret; \ 13445 __builtin_neon_vld1q_x4_v(&__ret, __p0, 51); \ 13446 \ 13447 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13448 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13449 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13450 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 13451 __ret; \ 13452 }) 13453 #endif 13454 13455 /* vld1q_u16_x4: declares a uint16x8x4_t __ret, passes &__ret and __p0 to __builtin_neon_vld1q_x4_v and yields __ret; the #else branch reverses the lanes of each val[] member first. */ #ifdef __LITTLE_ENDIAN__ 13456 #define vld1q_u16_x4(__p0) __extension__
({ \ 13457 uint16x8x4_t __ret; \ 13458 __builtin_neon_vld1q_x4_v(&__ret, __p0, 49); \ 13459 __ret; \ 13460 }) 13461 #else 13462 #define vld1q_u16_x4(__p0) __extension__ ({ \ 13463 uint16x8x4_t __ret; \ 13464 __builtin_neon_vld1q_x4_v(&__ret, __p0, 49); \ 13465 \ 13466 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13467 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13468 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13469 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 13470 __ret; \ 13471 }) 13472 #endif 13473 13474 #ifdef __LITTLE_ENDIAN__ 13475 #define vld1q_s8_x4(__p0) __extension__ ({ \ 13476 int8x16x4_t __ret; \ 13477 __builtin_neon_vld1q_x4_v(&__ret, __p0, 32); \ 13478 __ret; \ 13479 }) 13480 #else 13481 #define vld1q_s8_x4(__p0) __extension__ ({ \ 13482 int8x16x4_t __ret; \ 13483 __builtin_neon_vld1q_x4_v(&__ret, __p0, 32); \ 13484 \ 13485 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13486 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13487 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13488 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13489 __ret; \ 13490 }) 13491 #endif 13492 13493 #ifdef __LITTLE_ENDIAN__ 13494 #define vld1q_f32_x4(__p0) __extension__ ({ \ 13495 float32x4x4_t __ret; \ 13496 __builtin_neon_vld1q_x4_v(&__ret, __p0, 41); \ 13497 __ret; \ 13498 }) 13499 #else 13500 #define vld1q_f32_x4(__p0) __extension__ ({ \ 13501 float32x4x4_t __ret; \ 13502 __builtin_neon_vld1q_x4_v(&__ret, __p0, 41); \ 13503 \ 13504 __ret.val[0] = 
__builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13505 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13506 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13507 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 13508 __ret; \ 13509 }) 13510 #endif 13511 13512 #ifdef __LITTLE_ENDIAN__ 13513 #define vld1q_s32_x4(__p0) __extension__ ({ \ 13514 int32x4x4_t __ret; \ 13515 __builtin_neon_vld1q_x4_v(&__ret, __p0, 34); \ 13516 __ret; \ 13517 }) 13518 #else 13519 #define vld1q_s32_x4(__p0) __extension__ ({ \ 13520 int32x4x4_t __ret; \ 13521 __builtin_neon_vld1q_x4_v(&__ret, __p0, 34); \ 13522 \ 13523 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13524 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13525 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13526 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 13527 __ret; \ 13528 }) 13529 #endif 13530 13531 #ifdef __LITTLE_ENDIAN__ 13532 #define vld1q_s64_x4(__p0) __extension__ ({ \ 13533 int64x2x4_t __ret; \ 13534 __builtin_neon_vld1q_x4_v(&__ret, __p0, 35); \ 13535 __ret; \ 13536 }) 13537 #else 13538 #define vld1q_s64_x4(__p0) __extension__ ({ \ 13539 int64x2x4_t __ret; \ 13540 __builtin_neon_vld1q_x4_v(&__ret, __p0, 35); \ 13541 \ 13542 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13543 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13544 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13545 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 13546 __ret; \ 13547 }) 13548 #endif 13549 13550 #ifdef __LITTLE_ENDIAN__ 13551 #define vld1q_s16_x4(__p0) __extension__ ({ \ 13552 int16x8x4_t __ret; \ 13553 __builtin_neon_vld1q_x4_v(&__ret, __p0, 33); \ 13554 __ret; \ 
13555 }) 13556 #else 13557 #define vld1q_s16_x4(__p0) __extension__ ({ \ 13558 int16x8x4_t __ret; \ 13559 __builtin_neon_vld1q_x4_v(&__ret, __p0, 33); \ 13560 \ 13561 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13562 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13563 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13564 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 13565 __ret; \ 13566 }) 13567 #endif 13568 13569 #ifdef __LITTLE_ENDIAN__ 13570 #define vld1_u8_x4(__p0) __extension__ ({ \ 13571 uint8x8x4_t __ret; \ 13572 __builtin_neon_vld1_x4_v(&__ret, __p0, 16); \ 13573 __ret; \ 13574 }) 13575 #else 13576 #define vld1_u8_x4(__p0) __extension__ ({ \ 13577 uint8x8x4_t __ret; \ 13578 __builtin_neon_vld1_x4_v(&__ret, __p0, 16); \ 13579 \ 13580 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13581 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13582 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13583 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 13584 __ret; \ 13585 }) 13586 #endif 13587 13588 #ifdef __LITTLE_ENDIAN__ 13589 #define vld1_u32_x4(__p0) __extension__ ({ \ 13590 uint32x2x4_t __ret; \ 13591 __builtin_neon_vld1_x4_v(&__ret, __p0, 18); \ 13592 __ret; \ 13593 }) 13594 #else 13595 #define vld1_u32_x4(__p0) __extension__ ({ \ 13596 uint32x2x4_t __ret; \ 13597 __builtin_neon_vld1_x4_v(&__ret, __p0, 18); \ 13598 \ 13599 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13600 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13601 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13602 __ret.val[3] = 
__builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 13603 __ret; \ 13604 }) 13605 #endif 13606 13607 #define vld1_u64_x4(__p0) __extension__ ({ \ 13608 uint64x1x4_t __ret; \ 13609 __builtin_neon_vld1_x4_v(&__ret, __p0, 19); \ 13610 __ret; \ 13611 }) 13612 #ifdef __LITTLE_ENDIAN__ 13613 #define vld1_u16_x4(__p0) __extension__ ({ \ 13614 uint16x4x4_t __ret; \ 13615 __builtin_neon_vld1_x4_v(&__ret, __p0, 17); \ 13616 __ret; \ 13617 }) 13618 #else 13619 #define vld1_u16_x4(__p0) __extension__ ({ \ 13620 uint16x4x4_t __ret; \ 13621 __builtin_neon_vld1_x4_v(&__ret, __p0, 17); \ 13622 \ 13623 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13624 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13625 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13626 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 13627 __ret; \ 13628 }) 13629 #endif 13630 13631 #ifdef __LITTLE_ENDIAN__ 13632 #define vld1_s8_x4(__p0) __extension__ ({ \ 13633 int8x8x4_t __ret; \ 13634 __builtin_neon_vld1_x4_v(&__ret, __p0, 0); \ 13635 __ret; \ 13636 }) 13637 #else 13638 #define vld1_s8_x4(__p0) __extension__ ({ \ 13639 int8x8x4_t __ret; \ 13640 __builtin_neon_vld1_x4_v(&__ret, __p0, 0); \ 13641 \ 13642 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13643 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13644 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 13645 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 13646 __ret; \ 13647 }) 13648 #endif 13649 13650 #ifdef __LITTLE_ENDIAN__ 13651 #define vld1_f32_x4(__p0) __extension__ ({ \ 13652 float32x2x4_t __ret; \ 13653 __builtin_neon_vld1_x4_v(&__ret, __p0, 9); \ 13654 __ret; \ 13655 }) 13656 #else 13657 #define vld1_f32_x4(__p0) 
__extension__ ({ \ 13658 float32x2x4_t __ret; \ 13659 __builtin_neon_vld1_x4_v(&__ret, __p0, 9); \ 13660 \ 13661 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13662 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13663 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13664 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 13665 __ret; \ 13666 }) 13667 #endif 13668 13669 #ifdef __LITTLE_ENDIAN__ 13670 #define vld1_s32_x4(__p0) __extension__ ({ \ 13671 int32x2x4_t __ret; \ 13672 __builtin_neon_vld1_x4_v(&__ret, __p0, 2); \ 13673 __ret; \ 13674 }) 13675 #else 13676 #define vld1_s32_x4(__p0) __extension__ ({ \ 13677 int32x2x4_t __ret; \ 13678 __builtin_neon_vld1_x4_v(&__ret, __p0, 2); \ 13679 \ 13680 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13681 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13682 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 13683 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 13684 __ret; \ 13685 }) 13686 #endif 13687 13688 #define vld1_s64_x4(__p0) __extension__ ({ \ 13689 int64x1x4_t __ret; \ 13690 __builtin_neon_vld1_x4_v(&__ret, __p0, 3); \ 13691 __ret; \ 13692 }) 13693 #ifdef __LITTLE_ENDIAN__ 13694 #define vld1_s16_x4(__p0) __extension__ ({ \ 13695 int16x4x4_t __ret; \ 13696 __builtin_neon_vld1_x4_v(&__ret, __p0, 1); \ 13697 __ret; \ 13698 }) 13699 #else 13700 #define vld1_s16_x4(__p0) __extension__ ({ \ 13701 int16x4x4_t __ret; \ 13702 __builtin_neon_vld1_x4_v(&__ret, __p0, 1); \ 13703 \ 13704 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13705 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13706 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 13707 __ret.val[3] = __builtin_shufflevector(__ret.val[3], 
__ret.val[3], 3, 2, 1, 0); \ 13708 __ret; \ 13709 }) 13710 #endif 13711 13712 #ifdef __LITTLE_ENDIAN__ 13713 #define vld2_p8(__p0) __extension__ ({ \ 13714 poly8x8x2_t __ret; \ 13715 __builtin_neon_vld2_v(&__ret, __p0, 4); \ 13716 __ret; \ 13717 }) 13718 #else 13719 #define vld2_p8(__p0) __extension__ ({ \ 13720 poly8x8x2_t __ret; \ 13721 __builtin_neon_vld2_v(&__ret, __p0, 4); \ 13722 \ 13723 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13724 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13725 __ret; \ 13726 }) 13727 #endif 13728 13729 #ifdef __LITTLE_ENDIAN__ 13730 #define vld2_p16(__p0) __extension__ ({ \ 13731 poly16x4x2_t __ret; \ 13732 __builtin_neon_vld2_v(&__ret, __p0, 5); \ 13733 __ret; \ 13734 }) 13735 #else 13736 #define vld2_p16(__p0) __extension__ ({ \ 13737 poly16x4x2_t __ret; \ 13738 __builtin_neon_vld2_v(&__ret, __p0, 5); \ 13739 \ 13740 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13741 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13742 __ret; \ 13743 }) 13744 #endif 13745 13746 #ifdef __LITTLE_ENDIAN__ 13747 #define vld2q_p8(__p0) __extension__ ({ \ 13748 poly8x16x2_t __ret; \ 13749 __builtin_neon_vld2q_v(&__ret, __p0, 36); \ 13750 __ret; \ 13751 }) 13752 #else 13753 #define vld2q_p8(__p0) __extension__ ({ \ 13754 poly8x16x2_t __ret; \ 13755 __builtin_neon_vld2q_v(&__ret, __p0, 36); \ 13756 \ 13757 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13758 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13759 __ret; \ 13760 }) 13761 #endif 13762 13763 #ifdef __LITTLE_ENDIAN__ 13764 #define vld2q_p16(__p0) __extension__ ({ \ 13765 poly16x8x2_t __ret; \ 13766 __builtin_neon_vld2q_v(&__ret, __p0, 37); \ 13767 __ret; \ 13768 }) 13769 #else 
13770 #define vld2q_p16(__p0) __extension__ ({ \ 13771 poly16x8x2_t __ret; \ 13772 __builtin_neon_vld2q_v(&__ret, __p0, 37); \ 13773 \ 13774 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13775 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13776 __ret; \ 13777 }) 13778 #endif 13779 13780 #ifdef __LITTLE_ENDIAN__ 13781 #define vld2q_u8(__p0) __extension__ ({ \ 13782 uint8x16x2_t __ret; \ 13783 __builtin_neon_vld2q_v(&__ret, __p0, 48); \ 13784 __ret; \ 13785 }) 13786 #else 13787 #define vld2q_u8(__p0) __extension__ ({ \ 13788 uint8x16x2_t __ret; \ 13789 __builtin_neon_vld2q_v(&__ret, __p0, 48); \ 13790 \ 13791 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13792 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13793 __ret; \ 13794 }) 13795 #endif 13796 13797 #ifdef __LITTLE_ENDIAN__ 13798 #define vld2q_u32(__p0) __extension__ ({ \ 13799 uint32x4x2_t __ret; \ 13800 __builtin_neon_vld2q_v(&__ret, __p0, 50); \ 13801 __ret; \ 13802 }) 13803 #else 13804 #define vld2q_u32(__p0) __extension__ ({ \ 13805 uint32x4x2_t __ret; \ 13806 __builtin_neon_vld2q_v(&__ret, __p0, 50); \ 13807 \ 13808 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13809 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13810 __ret; \ 13811 }) 13812 #endif 13813 13814 #ifdef __LITTLE_ENDIAN__ 13815 #define vld2q_u16(__p0) __extension__ ({ \ 13816 uint16x8x2_t __ret; \ 13817 __builtin_neon_vld2q_v(&__ret, __p0, 49); \ 13818 __ret; \ 13819 }) 13820 #else 13821 #define vld2q_u16(__p0) __extension__ ({ \ 13822 uint16x8x2_t __ret; \ 13823 __builtin_neon_vld2q_v(&__ret, __p0, 49); \ 13824 \ 13825 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13826 
__ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13827 __ret; \ 13828 }) 13829 #endif 13830 13831 #ifdef __LITTLE_ENDIAN__ 13832 #define vld2q_s8(__p0) __extension__ ({ \ 13833 int8x16x2_t __ret; \ 13834 __builtin_neon_vld2q_v(&__ret, __p0, 32); \ 13835 __ret; \ 13836 }) 13837 #else 13838 #define vld2q_s8(__p0) __extension__ ({ \ 13839 int8x16x2_t __ret; \ 13840 __builtin_neon_vld2q_v(&__ret, __p0, 32); \ 13841 \ 13842 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13843 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 13844 __ret; \ 13845 }) 13846 #endif 13847 13848 #ifdef __LITTLE_ENDIAN__ 13849 #define vld2q_f32(__p0) __extension__ ({ \ 13850 float32x4x2_t __ret; \ 13851 __builtin_neon_vld2q_v(&__ret, __p0, 41); \ 13852 __ret; \ 13853 }) 13854 #else 13855 #define vld2q_f32(__p0) __extension__ ({ \ 13856 float32x4x2_t __ret; \ 13857 __builtin_neon_vld2q_v(&__ret, __p0, 41); \ 13858 \ 13859 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13860 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13861 __ret; \ 13862 }) 13863 #endif 13864 13865 #ifdef __LITTLE_ENDIAN__ 13866 #define vld2q_s32(__p0) __extension__ ({ \ 13867 int32x4x2_t __ret; \ 13868 __builtin_neon_vld2q_v(&__ret, __p0, 34); \ 13869 __ret; \ 13870 }) 13871 #else 13872 #define vld2q_s32(__p0) __extension__ ({ \ 13873 int32x4x2_t __ret; \ 13874 __builtin_neon_vld2q_v(&__ret, __p0, 34); \ 13875 \ 13876 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13877 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13878 __ret; \ 13879 }) 13880 #endif 13881 13882 #ifdef __LITTLE_ENDIAN__ 13883 #define vld2q_s16(__p0) __extension__ ({ \ 13884 int16x8x2_t __ret; \ 13885 
__builtin_neon_vld2q_v(&__ret, __p0, 33); \ 13886 __ret; \ 13887 }) 13888 #else 13889 #define vld2q_s16(__p0) __extension__ ({ \ 13890 int16x8x2_t __ret; \ 13891 __builtin_neon_vld2q_v(&__ret, __p0, 33); \ 13892 \ 13893 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13894 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13895 __ret; \ 13896 }) 13897 #endif 13898 13899 #ifdef __LITTLE_ENDIAN__ 13900 #define vld2_u8(__p0) __extension__ ({ \ 13901 uint8x8x2_t __ret; \ 13902 __builtin_neon_vld2_v(&__ret, __p0, 16); \ 13903 __ret; \ 13904 }) 13905 #else 13906 #define vld2_u8(__p0) __extension__ ({ \ 13907 uint8x8x2_t __ret; \ 13908 __builtin_neon_vld2_v(&__ret, __p0, 16); \ 13909 \ 13910 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13911 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13912 __ret; \ 13913 }) 13914 #endif 13915 13916 #ifdef __LITTLE_ENDIAN__ 13917 #define vld2_u32(__p0) __extension__ ({ \ 13918 uint32x2x2_t __ret; \ 13919 __builtin_neon_vld2_v(&__ret, __p0, 18); \ 13920 __ret; \ 13921 }) 13922 #else 13923 #define vld2_u32(__p0) __extension__ ({ \ 13924 uint32x2x2_t __ret; \ 13925 __builtin_neon_vld2_v(&__ret, __p0, 18); \ 13926 \ 13927 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13928 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13929 __ret; \ 13930 }) 13931 #endif 13932 13933 #define vld2_u64(__p0) __extension__ ({ \ 13934 uint64x1x2_t __ret; \ 13935 __builtin_neon_vld2_v(&__ret, __p0, 19); \ 13936 __ret; \ 13937 }) 13938 #ifdef __LITTLE_ENDIAN__ 13939 #define vld2_u16(__p0) __extension__ ({ \ 13940 uint16x4x2_t __ret; \ 13941 __builtin_neon_vld2_v(&__ret, __p0, 17); \ 13942 __ret; \ 13943 }) 13944 #else 13945 #define vld2_u16(__p0) __extension__ ({ \ 13946 uint16x4x2_t __ret; \ 13947 
__builtin_neon_vld2_v(&__ret, __p0, 17); \ 13948 \ 13949 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 13950 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 13951 __ret; \ 13952 }) 13953 #endif 13954 13955 #ifdef __LITTLE_ENDIAN__ 13956 #define vld2_s8(__p0) __extension__ ({ \ 13957 int8x8x2_t __ret; \ 13958 __builtin_neon_vld2_v(&__ret, __p0, 0); \ 13959 __ret; \ 13960 }) 13961 #else 13962 #define vld2_s8(__p0) __extension__ ({ \ 13963 int8x8x2_t __ret; \ 13964 __builtin_neon_vld2_v(&__ret, __p0, 0); \ 13965 \ 13966 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 13967 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 13968 __ret; \ 13969 }) 13970 #endif 13971 13972 #ifdef __LITTLE_ENDIAN__ 13973 #define vld2_f32(__p0) __extension__ ({ \ 13974 float32x2x2_t __ret; \ 13975 __builtin_neon_vld2_v(&__ret, __p0, 9); \ 13976 __ret; \ 13977 }) 13978 #else 13979 #define vld2_f32(__p0) __extension__ ({ \ 13980 float32x2x2_t __ret; \ 13981 __builtin_neon_vld2_v(&__ret, __p0, 9); \ 13982 \ 13983 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 13984 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 13985 __ret; \ 13986 }) 13987 #endif 13988 13989 #ifdef __LITTLE_ENDIAN__ 13990 #define vld2_s32(__p0) __extension__ ({ \ 13991 int32x2x2_t __ret; \ 13992 __builtin_neon_vld2_v(&__ret, __p0, 2); \ 13993 __ret; \ 13994 }) 13995 #else 13996 #define vld2_s32(__p0) __extension__ ({ \ 13997 int32x2x2_t __ret; \ 13998 __builtin_neon_vld2_v(&__ret, __p0, 2); \ 13999 \ 14000 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14001 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14002 __ret; \ 14003 }) 14004 #endif 14005 14006 #define vld2_s64(__p0) __extension__ ({ \ 14007 int64x1x2_t __ret; \ 14008 
__builtin_neon_vld2_v(&__ret, __p0, 3); \ 14009 __ret; \ 14010 }) 14011 #ifdef __LITTLE_ENDIAN__ 14012 #define vld2_s16(__p0) __extension__ ({ \ 14013 int16x4x2_t __ret; \ 14014 __builtin_neon_vld2_v(&__ret, __p0, 1); \ 14015 __ret; \ 14016 }) 14017 #else 14018 #define vld2_s16(__p0) __extension__ ({ \ 14019 int16x4x2_t __ret; \ 14020 __builtin_neon_vld2_v(&__ret, __p0, 1); \ 14021 \ 14022 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14023 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14024 __ret; \ 14025 }) 14026 #endif 14027 14028 #ifdef __LITTLE_ENDIAN__ 14029 #define vld2_dup_p8(__p0) __extension__ ({ \ 14030 poly8x8x2_t __ret; \ 14031 __builtin_neon_vld2_dup_v(&__ret, __p0, 4); \ 14032 __ret; \ 14033 }) 14034 #else 14035 #define vld2_dup_p8(__p0) __extension__ ({ \ 14036 poly8x8x2_t __ret; \ 14037 __builtin_neon_vld2_dup_v(&__ret, __p0, 4); \ 14038 \ 14039 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14040 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14041 __ret; \ 14042 }) 14043 #endif 14044 14045 #ifdef __LITTLE_ENDIAN__ 14046 #define vld2_dup_p16(__p0) __extension__ ({ \ 14047 poly16x4x2_t __ret; \ 14048 __builtin_neon_vld2_dup_v(&__ret, __p0, 5); \ 14049 __ret; \ 14050 }) 14051 #else 14052 #define vld2_dup_p16(__p0) __extension__ ({ \ 14053 poly16x4x2_t __ret; \ 14054 __builtin_neon_vld2_dup_v(&__ret, __p0, 5); \ 14055 \ 14056 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14057 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14058 __ret; \ 14059 }) 14060 #endif 14061 14062 #ifdef __LITTLE_ENDIAN__ 14063 #define vld2q_dup_p8(__p0) __extension__ ({ \ 14064 poly8x16x2_t __ret; \ 14065 __builtin_neon_vld2q_dup_v(&__ret, __p0, 36); \ 14066 __ret; \ 14067 }) 14068 #else 14069 #define vld2q_dup_p8(__p0) __extension__ ({ \ 
14070 poly8x16x2_t __ret; \ 14071 __builtin_neon_vld2q_dup_v(&__ret, __p0, 36); \ 14072 \ 14073 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14074 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14075 __ret; \ 14076 }) 14077 #endif 14078 14079 #ifdef __LITTLE_ENDIAN__ 14080 #define vld2q_dup_p16(__p0) __extension__ ({ \ 14081 poly16x8x2_t __ret; \ 14082 __builtin_neon_vld2q_dup_v(&__ret, __p0, 37); \ 14083 __ret; \ 14084 }) 14085 #else 14086 #define vld2q_dup_p16(__p0) __extension__ ({ \ 14087 poly16x8x2_t __ret; \ 14088 __builtin_neon_vld2q_dup_v(&__ret, __p0, 37); \ 14089 \ 14090 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14091 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14092 __ret; \ 14093 }) 14094 #endif 14095 14096 #ifdef __LITTLE_ENDIAN__ 14097 #define vld2q_dup_u8(__p0) __extension__ ({ \ 14098 uint8x16x2_t __ret; \ 14099 __builtin_neon_vld2q_dup_v(&__ret, __p0, 48); \ 14100 __ret; \ 14101 }) 14102 #else 14103 #define vld2q_dup_u8(__p0) __extension__ ({ \ 14104 uint8x16x2_t __ret; \ 14105 __builtin_neon_vld2q_dup_v(&__ret, __p0, 48); \ 14106 \ 14107 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14108 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14109 __ret; \ 14110 }) 14111 #endif 14112 14113 #ifdef __LITTLE_ENDIAN__ 14114 #define vld2q_dup_u32(__p0) __extension__ ({ \ 14115 uint32x4x2_t __ret; \ 14116 __builtin_neon_vld2q_dup_v(&__ret, __p0, 50); \ 14117 __ret; \ 14118 }) 14119 #else 14120 #define vld2q_dup_u32(__p0) __extension__ ({ \ 14121 uint32x4x2_t __ret; \ 14122 __builtin_neon_vld2q_dup_v(&__ret, __p0, 50); \ 14123 \ 14124 __ret.val[0] = 
__builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14125 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14126 __ret; \ 14127 }) 14128 #endif 14129 14130 #ifdef __LITTLE_ENDIAN__ 14131 #define vld2q_dup_u64(__p0) __extension__ ({ \ 14132 uint64x2x2_t __ret; \ 14133 __builtin_neon_vld2q_dup_v(&__ret, __p0, 51); \ 14134 __ret; \ 14135 }) 14136 #else 14137 #define vld2q_dup_u64(__p0) __extension__ ({ \ 14138 uint64x2x2_t __ret; \ 14139 __builtin_neon_vld2q_dup_v(&__ret, __p0, 51); \ 14140 \ 14141 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14142 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14143 __ret; \ 14144 }) 14145 #endif 14146 14147 #ifdef __LITTLE_ENDIAN__ 14148 #define vld2q_dup_u16(__p0) __extension__ ({ \ 14149 uint16x8x2_t __ret; \ 14150 __builtin_neon_vld2q_dup_v(&__ret, __p0, 49); \ 14151 __ret; \ 14152 }) 14153 #else 14154 #define vld2q_dup_u16(__p0) __extension__ ({ \ 14155 uint16x8x2_t __ret; \ 14156 __builtin_neon_vld2q_dup_v(&__ret, __p0, 49); \ 14157 \ 14158 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14159 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14160 __ret; \ 14161 }) 14162 #endif 14163 14164 #ifdef __LITTLE_ENDIAN__ 14165 #define vld2q_dup_s8(__p0) __extension__ ({ \ 14166 int8x16x2_t __ret; \ 14167 __builtin_neon_vld2q_dup_v(&__ret, __p0, 32); \ 14168 __ret; \ 14169 }) 14170 #else 14171 #define vld2q_dup_s8(__p0) __extension__ ({ \ 14172 int8x16x2_t __ret; \ 14173 __builtin_neon_vld2q_dup_v(&__ret, __p0, 32); \ 14174 \ 14175 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14176 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14177 __ret; \ 14178 }) 14179 #endif 14180 14181 #ifdef 
__LITTLE_ENDIAN__ 14182 #define vld2q_dup_f32(__p0) __extension__ ({ \ 14183 float32x4x2_t __ret; \ 14184 __builtin_neon_vld2q_dup_v(&__ret, __p0, 41); \ 14185 __ret; \ 14186 }) 14187 #else 14188 #define vld2q_dup_f32(__p0) __extension__ ({ \ 14189 float32x4x2_t __ret; \ 14190 __builtin_neon_vld2q_dup_v(&__ret, __p0, 41); \ 14191 \ 14192 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14193 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14194 __ret; \ 14195 }) 14196 #endif 14197 14198 #ifdef __LITTLE_ENDIAN__ 14199 #define vld2q_dup_s32(__p0) __extension__ ({ \ 14200 int32x4x2_t __ret; \ 14201 __builtin_neon_vld2q_dup_v(&__ret, __p0, 34); \ 14202 __ret; \ 14203 }) 14204 #else 14205 #define vld2q_dup_s32(__p0) __extension__ ({ \ 14206 int32x4x2_t __ret; \ 14207 __builtin_neon_vld2q_dup_v(&__ret, __p0, 34); \ 14208 \ 14209 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14210 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14211 __ret; \ 14212 }) 14213 #endif 14214 14215 #ifdef __LITTLE_ENDIAN__ 14216 #define vld2q_dup_s64(__p0) __extension__ ({ \ 14217 int64x2x2_t __ret; \ 14218 __builtin_neon_vld2q_dup_v(&__ret, __p0, 35); \ 14219 __ret; \ 14220 }) 14221 #else 14222 #define vld2q_dup_s64(__p0) __extension__ ({ \ 14223 int64x2x2_t __ret; \ 14224 __builtin_neon_vld2q_dup_v(&__ret, __p0, 35); \ 14225 \ 14226 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14227 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14228 __ret; \ 14229 }) 14230 #endif 14231 14232 #ifdef __LITTLE_ENDIAN__ 14233 #define vld2q_dup_s16(__p0) __extension__ ({ \ 14234 int16x8x2_t __ret; \ 14235 __builtin_neon_vld2q_dup_v(&__ret, __p0, 33); \ 14236 __ret; \ 14237 }) 14238 #else 14239 #define vld2q_dup_s16(__p0) __extension__ ({ \ 14240 int16x8x2_t __ret; \ 14241 __builtin_neon_vld2q_dup_v(&__ret, __p0, 33); \ 
14242 \ 14243 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14244 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14245 __ret; \ 14246 }) 14247 #endif 14248 14249 #ifdef __LITTLE_ENDIAN__ 14250 #define vld2_dup_u8(__p0) __extension__ ({ \ 14251 uint8x8x2_t __ret; \ 14252 __builtin_neon_vld2_dup_v(&__ret, __p0, 16); \ 14253 __ret; \ 14254 }) 14255 #else 14256 #define vld2_dup_u8(__p0) __extension__ ({ \ 14257 uint8x8x2_t __ret; \ 14258 __builtin_neon_vld2_dup_v(&__ret, __p0, 16); \ 14259 \ 14260 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14261 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14262 __ret; \ 14263 }) 14264 #endif 14265 14266 #ifdef __LITTLE_ENDIAN__ 14267 #define vld2_dup_u32(__p0) __extension__ ({ \ 14268 uint32x2x2_t __ret; \ 14269 __builtin_neon_vld2_dup_v(&__ret, __p0, 18); \ 14270 __ret; \ 14271 }) 14272 #else 14273 #define vld2_dup_u32(__p0) __extension__ ({ \ 14274 uint32x2x2_t __ret; \ 14275 __builtin_neon_vld2_dup_v(&__ret, __p0, 18); \ 14276 \ 14277 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14278 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14279 __ret; \ 14280 }) 14281 #endif 14282 14283 #define vld2_dup_u64(__p0) __extension__ ({ \ 14284 uint64x1x2_t __ret; \ 14285 __builtin_neon_vld2_dup_v(&__ret, __p0, 19); \ 14286 __ret; \ 14287 }) 14288 #ifdef __LITTLE_ENDIAN__ 14289 #define vld2_dup_u16(__p0) __extension__ ({ \ 14290 uint16x4x2_t __ret; \ 14291 __builtin_neon_vld2_dup_v(&__ret, __p0, 17); \ 14292 __ret; \ 14293 }) 14294 #else 14295 #define vld2_dup_u16(__p0) __extension__ ({ \ 14296 uint16x4x2_t __ret; \ 14297 __builtin_neon_vld2_dup_v(&__ret, __p0, 17); \ 14298 \ 14299 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14300 __ret.val[1] = 
__builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14301 __ret; \ 14302 }) 14303 #endif 14304 14305 #ifdef __LITTLE_ENDIAN__ 14306 #define vld2_dup_s8(__p0) __extension__ ({ \ 14307 int8x8x2_t __ret; \ 14308 __builtin_neon_vld2_dup_v(&__ret, __p0, 0); \ 14309 __ret; \ 14310 }) 14311 #else 14312 #define vld2_dup_s8(__p0) __extension__ ({ \ 14313 int8x8x2_t __ret; \ 14314 __builtin_neon_vld2_dup_v(&__ret, __p0, 0); \ 14315 \ 14316 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14317 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14318 __ret; \ 14319 }) 14320 #endif 14321 14322 #ifdef __LITTLE_ENDIAN__ 14323 #define vld2_dup_f32(__p0) __extension__ ({ \ 14324 float32x2x2_t __ret; \ 14325 __builtin_neon_vld2_dup_v(&__ret, __p0, 9); \ 14326 __ret; \ 14327 }) 14328 #else 14329 #define vld2_dup_f32(__p0) __extension__ ({ \ 14330 float32x2x2_t __ret; \ 14331 __builtin_neon_vld2_dup_v(&__ret, __p0, 9); \ 14332 \ 14333 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14334 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14335 __ret; \ 14336 }) 14337 #endif 14338 14339 #ifdef __LITTLE_ENDIAN__ 14340 #define vld2_dup_s32(__p0) __extension__ ({ \ 14341 int32x2x2_t __ret; \ 14342 __builtin_neon_vld2_dup_v(&__ret, __p0, 2); \ 14343 __ret; \ 14344 }) 14345 #else 14346 #define vld2_dup_s32(__p0) __extension__ ({ \ 14347 int32x2x2_t __ret; \ 14348 __builtin_neon_vld2_dup_v(&__ret, __p0, 2); \ 14349 \ 14350 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14351 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14352 __ret; \ 14353 }) 14354 #endif 14355 14356 #define vld2_dup_s64(__p0) __extension__ ({ \ 14357 int64x1x2_t __ret; \ 14358 __builtin_neon_vld2_dup_v(&__ret, __p0, 3); \ 14359 __ret; \ 14360 }) 14361 #ifdef __LITTLE_ENDIAN__ 14362 #define vld2_dup_s16(__p0) 
__extension__ ({ \ 14363 int16x4x2_t __ret; \ 14364 __builtin_neon_vld2_dup_v(&__ret, __p0, 1); \ 14365 __ret; \ 14366 }) 14367 #else 14368 #define vld2_dup_s16(__p0) __extension__ ({ \ 14369 int16x4x2_t __ret; \ 14370 __builtin_neon_vld2_dup_v(&__ret, __p0, 1); \ 14371 \ 14372 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14373 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14374 __ret; \ 14375 }) 14376 #endif 14377 14378 #ifdef __LITTLE_ENDIAN__ 14379 #define vld2_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 14380 poly8x8x2_t __ret; \ 14381 poly8x8x2_t __s1 = __p1; \ 14382 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 4); \ 14383 __ret; \ 14384 }) 14385 #else 14386 #define vld2_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 14387 poly8x8x2_t __ret; \ 14388 poly8x8x2_t __s1 = __p1; \ 14389 poly8x8x2_t __rev1; \ 14390 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14391 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14392 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 4); \ 14393 \ 14394 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14395 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14396 __ret; \ 14397 }) 14398 #endif 14399 14400 #ifdef __LITTLE_ENDIAN__ 14401 #define vld2_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 14402 poly16x4x2_t __ret; \ 14403 poly16x4x2_t __s1 = __p1; \ 14404 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 5); \ 14405 __ret; \ 14406 }) 14407 #else 14408 #define vld2_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 14409 poly16x4x2_t __ret; \ 14410 poly16x4x2_t __s1 = __p1; \ 14411 poly16x4x2_t __rev1; \ 14412 __rev1.val[0] = 
__builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 14413 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 14414 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 5); \ 14415 \ 14416 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14417 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14418 __ret; \ 14419 }) 14420 #endif 14421 14422 #ifdef __LITTLE_ENDIAN__ 14423 #define vld2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 14424 poly16x8x2_t __ret; \ 14425 poly16x8x2_t __s1 = __p1; \ 14426 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 37); \ 14427 __ret; \ 14428 }) 14429 #else 14430 #define vld2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 14431 poly16x8x2_t __ret; \ 14432 poly16x8x2_t __s1 = __p1; \ 14433 poly16x8x2_t __rev1; \ 14434 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14435 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14436 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 37); \ 14437 \ 14438 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14439 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14440 __ret; \ 14441 }) 14442 #endif 14443 14444 #ifdef __LITTLE_ENDIAN__ 14445 #define vld2q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 14446 uint32x4x2_t __ret; \ 14447 uint32x4x2_t __s1 = __p1; \ 14448 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 50); \ 14449 __ret; \ 14450 }) 14451 #else 14452 #define vld2q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 14453 uint32x4x2_t __ret; \ 14454 uint32x4x2_t __s1 = __p1; \ 14455 uint32x4x2_t __rev1; \ 14456 __rev1.val[0] = 
__builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 14457 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 14458 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 50); \ 14459 \ 14460 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14461 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14462 __ret; \ 14463 }) 14464 #endif 14465 14466 #ifdef __LITTLE_ENDIAN__ 14467 #define vld2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 14468 uint16x8x2_t __ret; \ 14469 uint16x8x2_t __s1 = __p1; \ 14470 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 49); \ 14471 __ret; \ 14472 }) 14473 #else 14474 #define vld2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 14475 uint16x8x2_t __ret; \ 14476 uint16x8x2_t __s1 = __p1; \ 14477 uint16x8x2_t __rev1; \ 14478 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14479 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14480 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 49); \ 14481 \ 14482 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14483 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14484 __ret; \ 14485 }) 14486 #endif 14487 14488 #ifdef __LITTLE_ENDIAN__ 14489 #define vld2q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 14490 float32x4x2_t __ret; \ 14491 float32x4x2_t __s1 = __p1; \ 14492 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 41); \ 14493 __ret; \ 14494 }) 14495 #else 14496 #define vld2q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 14497 float32x4x2_t __ret; \ 14498 float32x4x2_t __s1 = __p1; \ 14499 float32x4x2_t __rev1; \ 14500 
__rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 14501 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 14502 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 41); \ 14503 \ 14504 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14505 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14506 __ret; \ 14507 }) 14508 #endif 14509 14510 #ifdef __LITTLE_ENDIAN__ 14511 #define vld2q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 14512 int32x4x2_t __ret; \ 14513 int32x4x2_t __s1 = __p1; \ 14514 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 34); \ 14515 __ret; \ 14516 }) 14517 #else 14518 #define vld2q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 14519 int32x4x2_t __ret; \ 14520 int32x4x2_t __s1 = __p1; \ 14521 int32x4x2_t __rev1; \ 14522 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 14523 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 14524 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 34); \ 14525 \ 14526 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14527 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14528 __ret; \ 14529 }) 14530 #endif 14531 14532 #ifdef __LITTLE_ENDIAN__ 14533 #define vld2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 14534 int16x8x2_t __ret; \ 14535 int16x8x2_t __s1 = __p1; \ 14536 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 33); \ 14537 __ret; \ 14538 }) 14539 #else 14540 #define vld2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 14541 int16x8x2_t __ret; \ 14542 int16x8x2_t __s1 = __p1; \ 14543 int16x8x2_t __rev1; \ 14544 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], 
__s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14545 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14546 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 33); \ 14547 \ 14548 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14549 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14550 __ret; \ 14551 }) 14552 #endif 14553 14554 #ifdef __LITTLE_ENDIAN__ 14555 #define vld2_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 14556 uint8x8x2_t __ret; \ 14557 uint8x8x2_t __s1 = __p1; \ 14558 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 16); \ 14559 __ret; \ 14560 }) 14561 #else 14562 #define vld2_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 14563 uint8x8x2_t __ret; \ 14564 uint8x8x2_t __s1 = __p1; \ 14565 uint8x8x2_t __rev1; \ 14566 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14567 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14568 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 16); \ 14569 \ 14570 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14571 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14572 __ret; \ 14573 }) 14574 #endif 14575 14576 #ifdef __LITTLE_ENDIAN__ 14577 #define vld2_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 14578 uint32x2x2_t __ret; \ 14579 uint32x2x2_t __s1 = __p1; \ 14580 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 18); \ 14581 __ret; \ 14582 }) 14583 #else 14584 #define vld2_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 14585 uint32x2x2_t __ret; \ 14586 uint32x2x2_t __s1 = __p1; \ 14587 uint32x2x2_t __rev1; \ 14588 __rev1.val[0] = 
__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 14589 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 14590 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 18); \ 14591 \ 14592 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14593 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14594 __ret; \ 14595 }) 14596 #endif 14597 14598 #ifdef __LITTLE_ENDIAN__ 14599 #define vld2_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 14600 uint16x4x2_t __ret; \ 14601 uint16x4x2_t __s1 = __p1; \ 14602 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 17); \ 14603 __ret; \ 14604 }) 14605 #else 14606 #define vld2_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 14607 uint16x4x2_t __ret; \ 14608 uint16x4x2_t __s1 = __p1; \ 14609 uint16x4x2_t __rev1; \ 14610 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 14611 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 14612 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 17); \ 14613 \ 14614 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14615 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14616 __ret; \ 14617 }) 14618 #endif 14619 14620 #ifdef __LITTLE_ENDIAN__ 14621 #define vld2_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 14622 int8x8x2_t __ret; \ 14623 int8x8x2_t __s1 = __p1; \ 14624 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 0); \ 14625 __ret; \ 14626 }) 14627 #else 14628 #define vld2_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 14629 int8x8x2_t __ret; \ 14630 int8x8x2_t __s1 = __p1; \ 14631 int8x8x2_t __rev1; \ 14632 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14633 __rev1.val[1] = 
__builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14634 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 0); \ 14635 \ 14636 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14637 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14638 __ret; \ 14639 }) 14640 #endif 14641 14642 #ifdef __LITTLE_ENDIAN__ 14643 #define vld2_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 14644 float32x2x2_t __ret; \ 14645 float32x2x2_t __s1 = __p1; \ 14646 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 9); \ 14647 __ret; \ 14648 }) 14649 #else 14650 #define vld2_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 14651 float32x2x2_t __ret; \ 14652 float32x2x2_t __s1 = __p1; \ 14653 float32x2x2_t __rev1; \ 14654 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 14655 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 14656 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 9); \ 14657 \ 14658 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14659 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14660 __ret; \ 14661 }) 14662 #endif 14663 14664 #ifdef __LITTLE_ENDIAN__ 14665 #define vld2_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 14666 int32x2x2_t __ret; \ 14667 int32x2x2_t __s1 = __p1; \ 14668 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 2); \ 14669 __ret; \ 14670 }) 14671 #else 14672 #define vld2_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 14673 int32x2x2_t __ret; \ 14674 int32x2x2_t __s1 = __p1; \ 14675 int32x2x2_t __rev1; \ 14676 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 14677 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 
14678 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 2); \ 14679 \ 14680 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14681 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14682 __ret; \ 14683 }) 14684 #endif 14685 14686 #ifdef __LITTLE_ENDIAN__ 14687 #define vld2_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 14688 int16x4x2_t __ret; \ 14689 int16x4x2_t __s1 = __p1; \ 14690 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 1); \ 14691 __ret; \ 14692 }) 14693 #else 14694 #define vld2_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 14695 int16x4x2_t __ret; \ 14696 int16x4x2_t __s1 = __p1; \ 14697 int16x4x2_t __rev1; \ 14698 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 14699 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 14700 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 1); \ 14701 \ 14702 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14703 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14704 __ret; \ 14705 }) 14706 #endif 14707 14708 #ifdef __LITTLE_ENDIAN__ 14709 #define vld3_p8(__p0) __extension__ ({ \ 14710 poly8x8x3_t __ret; \ 14711 __builtin_neon_vld3_v(&__ret, __p0, 4); \ 14712 __ret; \ 14713 }) 14714 #else 14715 #define vld3_p8(__p0) __extension__ ({ \ 14716 poly8x8x3_t __ret; \ 14717 __builtin_neon_vld3_v(&__ret, __p0, 4); \ 14718 \ 14719 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14720 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14721 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 14722 __ret; \ 14723 }) 14724 #endif 14725 14726 #ifdef __LITTLE_ENDIAN__ 14727 #define 
vld3_p16(__p0) __extension__ ({ \ 14728 poly16x4x3_t __ret; \ 14729 __builtin_neon_vld3_v(&__ret, __p0, 5); \ 14730 __ret; \ 14731 }) 14732 #else 14733 #define vld3_p16(__p0) __extension__ ({ \ 14734 poly16x4x3_t __ret; \ 14735 __builtin_neon_vld3_v(&__ret, __p0, 5); \ 14736 \ 14737 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14738 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14739 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 14740 __ret; \ 14741 }) 14742 #endif 14743 14744 #ifdef __LITTLE_ENDIAN__ 14745 #define vld3q_p8(__p0) __extension__ ({ \ 14746 poly8x16x3_t __ret; \ 14747 __builtin_neon_vld3q_v(&__ret, __p0, 36); \ 14748 __ret; \ 14749 }) 14750 #else 14751 #define vld3q_p8(__p0) __extension__ ({ \ 14752 poly8x16x3_t __ret; \ 14753 __builtin_neon_vld3q_v(&__ret, __p0, 36); \ 14754 \ 14755 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14756 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14757 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14758 __ret; \ 14759 }) 14760 #endif 14761 14762 #ifdef __LITTLE_ENDIAN__ 14763 #define vld3q_p16(__p0) __extension__ ({ \ 14764 poly16x8x3_t __ret; \ 14765 __builtin_neon_vld3q_v(&__ret, __p0, 37); \ 14766 __ret; \ 14767 }) 14768 #else 14769 #define vld3q_p16(__p0) __extension__ ({ \ 14770 poly16x8x3_t __ret; \ 14771 __builtin_neon_vld3q_v(&__ret, __p0, 37); \ 14772 \ 14773 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14774 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14775 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 14776 __ret; \ 14777 }) 
14778 #endif 14779 14780 #ifdef __LITTLE_ENDIAN__ 14781 #define vld3q_u8(__p0) __extension__ ({ \ 14782 uint8x16x3_t __ret; \ 14783 __builtin_neon_vld3q_v(&__ret, __p0, 48); \ 14784 __ret; \ 14785 }) 14786 #else 14787 #define vld3q_u8(__p0) __extension__ ({ \ 14788 uint8x16x3_t __ret; \ 14789 __builtin_neon_vld3q_v(&__ret, __p0, 48); \ 14790 \ 14791 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14792 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14793 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14794 __ret; \ 14795 }) 14796 #endif 14797 14798 #ifdef __LITTLE_ENDIAN__ 14799 #define vld3q_u32(__p0) __extension__ ({ \ 14800 uint32x4x3_t __ret; \ 14801 __builtin_neon_vld3q_v(&__ret, __p0, 50); \ 14802 __ret; \ 14803 }) 14804 #else 14805 #define vld3q_u32(__p0) __extension__ ({ \ 14806 uint32x4x3_t __ret; \ 14807 __builtin_neon_vld3q_v(&__ret, __p0, 50); \ 14808 \ 14809 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14810 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14811 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 14812 __ret; \ 14813 }) 14814 #endif 14815 14816 #ifdef __LITTLE_ENDIAN__ 14817 #define vld3q_u16(__p0) __extension__ ({ \ 14818 uint16x8x3_t __ret; \ 14819 __builtin_neon_vld3q_v(&__ret, __p0, 49); \ 14820 __ret; \ 14821 }) 14822 #else 14823 #define vld3q_u16(__p0) __extension__ ({ \ 14824 uint16x8x3_t __ret; \ 14825 __builtin_neon_vld3q_v(&__ret, __p0, 49); \ 14826 \ 14827 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14828 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14829 __ret.val[2] = 
__builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 14830 __ret; \ 14831 }) 14832 #endif 14833 14834 #ifdef __LITTLE_ENDIAN__ 14835 #define vld3q_s8(__p0) __extension__ ({ \ 14836 int8x16x3_t __ret; \ 14837 __builtin_neon_vld3q_v(&__ret, __p0, 32); \ 14838 __ret; \ 14839 }) 14840 #else 14841 #define vld3q_s8(__p0) __extension__ ({ \ 14842 int8x16x3_t __ret; \ 14843 __builtin_neon_vld3q_v(&__ret, __p0, 32); \ 14844 \ 14845 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14846 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14847 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 14848 __ret; \ 14849 }) 14850 #endif 14851 14852 #ifdef __LITTLE_ENDIAN__ 14853 #define vld3q_f32(__p0) __extension__ ({ \ 14854 float32x4x3_t __ret; \ 14855 __builtin_neon_vld3q_v(&__ret, __p0, 41); \ 14856 __ret; \ 14857 }) 14858 #else 14859 #define vld3q_f32(__p0) __extension__ ({ \ 14860 float32x4x3_t __ret; \ 14861 __builtin_neon_vld3q_v(&__ret, __p0, 41); \ 14862 \ 14863 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14864 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14865 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 14866 __ret; \ 14867 }) 14868 #endif 14869 14870 #ifdef __LITTLE_ENDIAN__ 14871 #define vld3q_s32(__p0) __extension__ ({ \ 14872 int32x4x3_t __ret; \ 14873 __builtin_neon_vld3q_v(&__ret, __p0, 34); \ 14874 __ret; \ 14875 }) 14876 #else 14877 #define vld3q_s32(__p0) __extension__ ({ \ 14878 int32x4x3_t __ret; \ 14879 __builtin_neon_vld3q_v(&__ret, __p0, 34); \ 14880 \ 14881 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14882 __ret.val[1] = __builtin_shufflevector(__ret.val[1], 
__ret.val[1], 3, 2, 1, 0); \ 14883 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 14884 __ret; \ 14885 }) 14886 #endif 14887 14888 #ifdef __LITTLE_ENDIAN__ 14889 #define vld3q_s16(__p0) __extension__ ({ \ 14890 int16x8x3_t __ret; \ 14891 __builtin_neon_vld3q_v(&__ret, __p0, 33); \ 14892 __ret; \ 14893 }) 14894 #else 14895 #define vld3q_s16(__p0) __extension__ ({ \ 14896 int16x8x3_t __ret; \ 14897 __builtin_neon_vld3q_v(&__ret, __p0, 33); \ 14898 \ 14899 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14900 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14901 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 14902 __ret; \ 14903 }) 14904 #endif 14905 14906 #ifdef __LITTLE_ENDIAN__ 14907 #define vld3_u8(__p0) __extension__ ({ \ 14908 uint8x8x3_t __ret; \ 14909 __builtin_neon_vld3_v(&__ret, __p0, 16); \ 14910 __ret; \ 14911 }) 14912 #else 14913 #define vld3_u8(__p0) __extension__ ({ \ 14914 uint8x8x3_t __ret; \ 14915 __builtin_neon_vld3_v(&__ret, __p0, 16); \ 14916 \ 14917 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14918 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14919 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 14920 __ret; \ 14921 }) 14922 #endif 14923 14924 #ifdef __LITTLE_ENDIAN__ 14925 #define vld3_u32(__p0) __extension__ ({ \ 14926 uint32x2x3_t __ret; \ 14927 __builtin_neon_vld3_v(&__ret, __p0, 18); \ 14928 __ret; \ 14929 }) 14930 #else 14931 #define vld3_u32(__p0) __extension__ ({ \ 14932 uint32x2x3_t __ret; \ 14933 __builtin_neon_vld3_v(&__ret, __p0, 18); \ 14934 \ 14935 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14936 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14937 
__ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 14938 __ret; \ 14939 }) 14940 #endif 14941 14942 #define vld3_u64(__p0) __extension__ ({ \ 14943 uint64x1x3_t __ret; \ 14944 __builtin_neon_vld3_v(&__ret, __p0, 19); \ 14945 __ret; \ 14946 }) 14947 #ifdef __LITTLE_ENDIAN__ 14948 #define vld3_u16(__p0) __extension__ ({ \ 14949 uint16x4x3_t __ret; \ 14950 __builtin_neon_vld3_v(&__ret, __p0, 17); \ 14951 __ret; \ 14952 }) 14953 #else 14954 #define vld3_u16(__p0) __extension__ ({ \ 14955 uint16x4x3_t __ret; \ 14956 __builtin_neon_vld3_v(&__ret, __p0, 17); \ 14957 \ 14958 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 14959 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 14960 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 14961 __ret; \ 14962 }) 14963 #endif 14964 14965 #ifdef __LITTLE_ENDIAN__ 14966 #define vld3_s8(__p0) __extension__ ({ \ 14967 int8x8x3_t __ret; \ 14968 __builtin_neon_vld3_v(&__ret, __p0, 0); \ 14969 __ret; \ 14970 }) 14971 #else 14972 #define vld3_s8(__p0) __extension__ ({ \ 14973 int8x8x3_t __ret; \ 14974 __builtin_neon_vld3_v(&__ret, __p0, 0); \ 14975 \ 14976 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 14977 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 14978 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 14979 __ret; \ 14980 }) 14981 #endif 14982 14983 #ifdef __LITTLE_ENDIAN__ 14984 #define vld3_f32(__p0) __extension__ ({ \ 14985 float32x2x3_t __ret; \ 14986 __builtin_neon_vld3_v(&__ret, __p0, 9); \ 14987 __ret; \ 14988 }) 14989 #else 14990 #define vld3_f32(__p0) __extension__ ({ \ 14991 float32x2x3_t __ret; \ 14992 __builtin_neon_vld3_v(&__ret, __p0, 9); \ 14993 \ 14994 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 14995 __ret.val[1] = 
__builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 14996 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 14997 __ret; \ 14998 }) 14999 #endif 15000 15001 #ifdef __LITTLE_ENDIAN__ 15002 #define vld3_s32(__p0) __extension__ ({ \ 15003 int32x2x3_t __ret; \ 15004 __builtin_neon_vld3_v(&__ret, __p0, 2); \ 15005 __ret; \ 15006 }) 15007 #else 15008 #define vld3_s32(__p0) __extension__ ({ \ 15009 int32x2x3_t __ret; \ 15010 __builtin_neon_vld3_v(&__ret, __p0, 2); \ 15011 \ 15012 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 15013 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 15014 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 15015 __ret; \ 15016 }) 15017 #endif 15018 15019 #define vld3_s64(__p0) __extension__ ({ \ 15020 int64x1x3_t __ret; \ 15021 __builtin_neon_vld3_v(&__ret, __p0, 3); \ 15022 __ret; \ 15023 }) 15024 #ifdef __LITTLE_ENDIAN__ 15025 #define vld3_s16(__p0) __extension__ ({ \ 15026 int16x4x3_t __ret; \ 15027 __builtin_neon_vld3_v(&__ret, __p0, 1); \ 15028 __ret; \ 15029 }) 15030 #else 15031 #define vld3_s16(__p0) __extension__ ({ \ 15032 int16x4x3_t __ret; \ 15033 __builtin_neon_vld3_v(&__ret, __p0, 1); \ 15034 \ 15035 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15036 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15037 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15038 __ret; \ 15039 }) 15040 #endif 15041 15042 #ifdef __LITTLE_ENDIAN__ 15043 #define vld3_dup_p8(__p0) __extension__ ({ \ 15044 poly8x8x3_t __ret; \ 15045 __builtin_neon_vld3_dup_v(&__ret, __p0, 4); \ 15046 __ret; \ 15047 }) 15048 #else 15049 #define vld3_dup_p8(__p0) __extension__ ({ \ 15050 poly8x8x3_t __ret; \ 15051 __builtin_neon_vld3_dup_v(&__ret, __p0, 4); \ 15052 \ 15053 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 
0); \ 15054 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15055 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15056 __ret; \ 15057 }) 15058 #endif 15059 15060 #ifdef __LITTLE_ENDIAN__ 15061 #define vld3_dup_p16(__p0) __extension__ ({ \ 15062 poly16x4x3_t __ret; \ 15063 __builtin_neon_vld3_dup_v(&__ret, __p0, 5); \ 15064 __ret; \ 15065 }) 15066 #else 15067 #define vld3_dup_p16(__p0) __extension__ ({ \ 15068 poly16x4x3_t __ret; \ 15069 __builtin_neon_vld3_dup_v(&__ret, __p0, 5); \ 15070 \ 15071 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15072 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15073 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15074 __ret; \ 15075 }) 15076 #endif 15077 15078 #ifdef __LITTLE_ENDIAN__ 15079 #define vld3q_dup_p8(__p0) __extension__ ({ \ 15080 poly8x16x3_t __ret; \ 15081 __builtin_neon_vld3q_dup_v(&__ret, __p0, 36); \ 15082 __ret; \ 15083 }) 15084 #else 15085 #define vld3q_dup_p8(__p0) __extension__ ({ \ 15086 poly8x16x3_t __ret; \ 15087 __builtin_neon_vld3q_dup_v(&__ret, __p0, 36); \ 15088 \ 15089 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15090 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15091 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15092 __ret; \ 15093 }) 15094 #endif 15095 15096 #ifdef __LITTLE_ENDIAN__ 15097 #define vld3q_dup_p16(__p0) __extension__ ({ \ 15098 poly16x8x3_t __ret; \ 15099 __builtin_neon_vld3q_dup_v(&__ret, __p0, 37); \ 15100 __ret; \ 15101 }) 15102 #else 15103 #define vld3q_dup_p16(__p0) __extension__ ({ \ 15104 poly16x8x3_t __ret; \ 15105 __builtin_neon_vld3q_dup_v(&__ret, 
__p0, 37); \ 15106 \ 15107 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15108 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15109 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15110 __ret; \ 15111 }) 15112 #endif 15113 15114 #ifdef __LITTLE_ENDIAN__ 15115 #define vld3q_dup_u8(__p0) __extension__ ({ \ 15116 uint8x16x3_t __ret; \ 15117 __builtin_neon_vld3q_dup_v(&__ret, __p0, 48); \ 15118 __ret; \ 15119 }) 15120 #else 15121 #define vld3q_dup_u8(__p0) __extension__ ({ \ 15122 uint8x16x3_t __ret; \ 15123 __builtin_neon_vld3q_dup_v(&__ret, __p0, 48); \ 15124 \ 15125 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15126 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15127 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15128 __ret; \ 15129 }) 15130 #endif 15131 15132 #ifdef __LITTLE_ENDIAN__ 15133 #define vld3q_dup_u32(__p0) __extension__ ({ \ 15134 uint32x4x3_t __ret; \ 15135 __builtin_neon_vld3q_dup_v(&__ret, __p0, 50); \ 15136 __ret; \ 15137 }) 15138 #else 15139 #define vld3q_dup_u32(__p0) __extension__ ({ \ 15140 uint32x4x3_t __ret; \ 15141 __builtin_neon_vld3q_dup_v(&__ret, __p0, 50); \ 15142 \ 15143 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15144 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15145 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15146 __ret; \ 15147 }) 15148 #endif 15149 15150 #ifdef __LITTLE_ENDIAN__ 15151 #define vld3q_dup_u64(__p0) __extension__ ({ \ 15152 uint64x2x3_t __ret; \ 15153 __builtin_neon_vld3q_dup_v(&__ret, __p0, 51); \ 15154 __ret; \ 15155 }) 15156 #else 15157 
#define vld3q_dup_u64(__p0) __extension__ ({ \ 15158 uint64x2x3_t __ret; \ 15159 __builtin_neon_vld3q_dup_v(&__ret, __p0, 51); \ 15160 \ 15161 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 15162 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 15163 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 15164 __ret; \ 15165 }) 15166 #endif 15167 15168 #ifdef __LITTLE_ENDIAN__ 15169 #define vld3q_dup_u16(__p0) __extension__ ({ \ 15170 uint16x8x3_t __ret; \ 15171 __builtin_neon_vld3q_dup_v(&__ret, __p0, 49); \ 15172 __ret; \ 15173 }) 15174 #else 15175 #define vld3q_dup_u16(__p0) __extension__ ({ \ 15176 uint16x8x3_t __ret; \ 15177 __builtin_neon_vld3q_dup_v(&__ret, __p0, 49); \ 15178 \ 15179 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15180 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15181 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15182 __ret; \ 15183 }) 15184 #endif 15185 15186 #ifdef __LITTLE_ENDIAN__ 15187 #define vld3q_dup_s8(__p0) __extension__ ({ \ 15188 int8x16x3_t __ret; \ 15189 __builtin_neon_vld3q_dup_v(&__ret, __p0, 32); \ 15190 __ret; \ 15191 }) 15192 #else 15193 #define vld3q_dup_s8(__p0) __extension__ ({ \ 15194 int8x16x3_t __ret; \ 15195 __builtin_neon_vld3q_dup_v(&__ret, __p0, 32); \ 15196 \ 15197 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15198 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15199 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15200 __ret; \ 15201 }) 15202 #endif 15203 15204 #ifdef __LITTLE_ENDIAN__ 15205 #define vld3q_dup_f32(__p0) __extension__ ({ \ 15206 float32x4x3_t __ret; 
\ 15207 __builtin_neon_vld3q_dup_v(&__ret, __p0, 41); \ 15208 __ret; \ 15209 }) 15210 #else 15211 #define vld3q_dup_f32(__p0) __extension__ ({ \ 15212 float32x4x3_t __ret; \ 15213 __builtin_neon_vld3q_dup_v(&__ret, __p0, 41); \ 15214 \ 15215 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15216 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15217 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15218 __ret; \ 15219 }) 15220 #endif 15221 15222 #ifdef __LITTLE_ENDIAN__ 15223 #define vld3q_dup_s32(__p0) __extension__ ({ \ 15224 int32x4x3_t __ret; \ 15225 __builtin_neon_vld3q_dup_v(&__ret, __p0, 34); \ 15226 __ret; \ 15227 }) 15228 #else 15229 #define vld3q_dup_s32(__p0) __extension__ ({ \ 15230 int32x4x3_t __ret; \ 15231 __builtin_neon_vld3q_dup_v(&__ret, __p0, 34); \ 15232 \ 15233 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15234 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15235 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15236 __ret; \ 15237 }) 15238 #endif 15239 15240 #ifdef __LITTLE_ENDIAN__ 15241 #define vld3q_dup_s64(__p0) __extension__ ({ \ 15242 int64x2x3_t __ret; \ 15243 __builtin_neon_vld3q_dup_v(&__ret, __p0, 35); \ 15244 __ret; \ 15245 }) 15246 #else 15247 #define vld3q_dup_s64(__p0) __extension__ ({ \ 15248 int64x2x3_t __ret; \ 15249 __builtin_neon_vld3q_dup_v(&__ret, __p0, 35); \ 15250 \ 15251 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 15252 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 15253 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 15254 __ret; \ 15255 }) 15256 #endif 15257 15258 #ifdef __LITTLE_ENDIAN__ 15259 #define vld3q_dup_s16(__p0) __extension__ ({ \ 15260 int16x8x3_t __ret; \ 15261 __builtin_neon_vld3q_dup_v(&__ret, __p0, 33); \ 15262 
__ret; \ 15263 }) 15264 #else 15265 #define vld3q_dup_s16(__p0) __extension__ ({ \ 15266 int16x8x3_t __ret; \ 15267 __builtin_neon_vld3q_dup_v(&__ret, __p0, 33); \ 15268 \ 15269 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15270 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15271 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15272 __ret; \ 15273 }) 15274 #endif 15275 15276 #ifdef __LITTLE_ENDIAN__ 15277 #define vld3_dup_u8(__p0) __extension__ ({ \ 15278 uint8x8x3_t __ret; \ 15279 __builtin_neon_vld3_dup_v(&__ret, __p0, 16); \ 15280 __ret; \ 15281 }) 15282 #else 15283 #define vld3_dup_u8(__p0) __extension__ ({ \ 15284 uint8x8x3_t __ret; \ 15285 __builtin_neon_vld3_dup_v(&__ret, __p0, 16); \ 15286 \ 15287 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15288 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15289 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15290 __ret; \ 15291 }) 15292 #endif 15293 15294 #ifdef __LITTLE_ENDIAN__ 15295 #define vld3_dup_u32(__p0) __extension__ ({ \ 15296 uint32x2x3_t __ret; \ 15297 __builtin_neon_vld3_dup_v(&__ret, __p0, 18); \ 15298 __ret; \ 15299 }) 15300 #else 15301 #define vld3_dup_u32(__p0) __extension__ ({ \ 15302 uint32x2x3_t __ret; \ 15303 __builtin_neon_vld3_dup_v(&__ret, __p0, 18); \ 15304 \ 15305 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 15306 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 15307 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 15308 __ret; \ 15309 }) 15310 #endif 15311 15312 #define vld3_dup_u64(__p0) __extension__ ({ \ 15313 uint64x1x3_t __ret; \ 15314 __builtin_neon_vld3_dup_v(&__ret, __p0, 19); \ 15315 __ret; \ 15316 }) 15317 #ifdef 
__LITTLE_ENDIAN__ 15318 #define vld3_dup_u16(__p0) __extension__ ({ \ 15319 uint16x4x3_t __ret; \ 15320 __builtin_neon_vld3_dup_v(&__ret, __p0, 17); \ 15321 __ret; \ 15322 }) 15323 #else 15324 #define vld3_dup_u16(__p0) __extension__ ({ \ 15325 uint16x4x3_t __ret; \ 15326 __builtin_neon_vld3_dup_v(&__ret, __p0, 17); \ 15327 \ 15328 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15329 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15330 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15331 __ret; \ 15332 }) 15333 #endif 15334 15335 #ifdef __LITTLE_ENDIAN__ 15336 #define vld3_dup_s8(__p0) __extension__ ({ \ 15337 int8x8x3_t __ret; \ 15338 __builtin_neon_vld3_dup_v(&__ret, __p0, 0); \ 15339 __ret; \ 15340 }) 15341 #else 15342 #define vld3_dup_s8(__p0) __extension__ ({ \ 15343 int8x8x3_t __ret; \ 15344 __builtin_neon_vld3_dup_v(&__ret, __p0, 0); \ 15345 \ 15346 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15347 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15348 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15349 __ret; \ 15350 }) 15351 #endif 15352 15353 #ifdef __LITTLE_ENDIAN__ 15354 #define vld3_dup_f32(__p0) __extension__ ({ \ 15355 float32x2x3_t __ret; \ 15356 __builtin_neon_vld3_dup_v(&__ret, __p0, 9); \ 15357 __ret; \ 15358 }) 15359 #else 15360 #define vld3_dup_f32(__p0) __extension__ ({ \ 15361 float32x2x3_t __ret; \ 15362 __builtin_neon_vld3_dup_v(&__ret, __p0, 9); \ 15363 \ 15364 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 15365 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 15366 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 15367 __ret; \ 15368 }) 15369 #endif 15370 15371 #ifdef __LITTLE_ENDIAN__ 15372 #define 
vld3_dup_s32(__p0) __extension__ ({ \ 15373 int32x2x3_t __ret; \ 15374 __builtin_neon_vld3_dup_v(&__ret, __p0, 2); \ 15375 __ret; \ 15376 }) 15377 #else 15378 #define vld3_dup_s32(__p0) __extension__ ({ \ 15379 int32x2x3_t __ret; \ 15380 __builtin_neon_vld3_dup_v(&__ret, __p0, 2); \ 15381 \ 15382 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 15383 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 15384 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 15385 __ret; \ 15386 }) 15387 #endif 15388 15389 #define vld3_dup_s64(__p0) __extension__ ({ \ 15390 int64x1x3_t __ret; \ 15391 __builtin_neon_vld3_dup_v(&__ret, __p0, 3); \ 15392 __ret; \ 15393 }) 15394 #ifdef __LITTLE_ENDIAN__ 15395 #define vld3_dup_s16(__p0) __extension__ ({ \ 15396 int16x4x3_t __ret; \ 15397 __builtin_neon_vld3_dup_v(&__ret, __p0, 1); \ 15398 __ret; \ 15399 }) 15400 #else 15401 #define vld3_dup_s16(__p0) __extension__ ({ \ 15402 int16x4x3_t __ret; \ 15403 __builtin_neon_vld3_dup_v(&__ret, __p0, 1); \ 15404 \ 15405 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15406 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15407 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15408 __ret; \ 15409 }) 15410 #endif 15411 15412 #ifdef __LITTLE_ENDIAN__ 15413 #define vld3_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 15414 poly8x8x3_t __ret; \ 15415 poly8x8x3_t __s1 = __p1; \ 15416 __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 4); \ 15417 __ret; \ 15418 }) 15419 #else 15420 #define vld3_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 15421 poly8x8x3_t __ret; \ 15422 poly8x8x3_t __s1 = __p1; \ 15423 poly8x8x3_t __rev1; \ 15424 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15425 __rev1.val[1] = 
__builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15426 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15427 __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 4); \ 15428 \ 15429 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15430 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15431 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15432 __ret; \ 15433 }) 15434 #endif 15435 15436 #ifdef __LITTLE_ENDIAN__ 15437 #define vld3_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 15438 poly16x4x3_t __ret; \ 15439 poly16x4x3_t __s1 = __p1; \ 15440 __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 5); \ 15441 __ret; \ 15442 }) 15443 #else 15444 #define vld3_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 15445 poly16x4x3_t __ret; \ 15446 poly16x4x3_t __s1 = __p1; \ 15447 poly16x4x3_t __rev1; \ 15448 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 15449 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 15450 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 15451 __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 5); \ 15452 \ 15453 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15454 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15455 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15456 __ret; \ 15457 }) 15458 #endif 15459 15460 #ifdef __LITTLE_ENDIAN__ 15461 #define vld3q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 15462 poly16x8x3_t __ret; \ 15463 poly16x8x3_t __s1 = 
__p1; \ 15464 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 37); \ 15465 __ret; \ 15466 }) 15467 #else 15468 #define vld3q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 15469 poly16x8x3_t __ret; \ 15470 poly16x8x3_t __s1 = __p1; \ 15471 poly16x8x3_t __rev1; \ 15472 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15473 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15474 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15475 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 37); \ 15476 \ 15477 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15478 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15479 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15480 __ret; \ 15481 }) 15482 #endif 15483 15484 #ifdef __LITTLE_ENDIAN__ 15485 #define vld3q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 15486 uint32x4x3_t __ret; \ 15487 uint32x4x3_t __s1 = __p1; \ 15488 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 50); \ 15489 __ret; \ 15490 }) 15491 #else 15492 #define vld3q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 15493 uint32x4x3_t __ret; \ 15494 uint32x4x3_t __s1 = __p1; \ 15495 uint32x4x3_t __rev1; \ 15496 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 15497 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 15498 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 15499 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 
50); \ 15500 \ 15501 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15502 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15503 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15504 __ret; \ 15505 }) 15506 #endif 15507 15508 #ifdef __LITTLE_ENDIAN__ 15509 #define vld3q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 15510 uint16x8x3_t __ret; \ 15511 uint16x8x3_t __s1 = __p1; \ 15512 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 49); \ 15513 __ret; \ 15514 }) 15515 #else 15516 #define vld3q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 15517 uint16x8x3_t __ret; \ 15518 uint16x8x3_t __s1 = __p1; \ 15519 uint16x8x3_t __rev1; \ 15520 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15521 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15522 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15523 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 49); \ 15524 \ 15525 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15526 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15527 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15528 __ret; \ 15529 }) 15530 #endif 15531 15532 #ifdef __LITTLE_ENDIAN__ 15533 #define vld3q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 15534 float32x4x3_t __ret; \ 15535 float32x4x3_t __s1 = __p1; \ 15536 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 41); \ 15537 __ret; \ 15538 }) 15539 #else 15540 #define vld3q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 15541 
float32x4x3_t __ret; \ 15542 float32x4x3_t __s1 = __p1; \ 15543 float32x4x3_t __rev1; \ 15544 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 15545 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 15546 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 15547 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 41); \ 15548 \ 15549 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15550 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15551 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15552 __ret; \ 15553 }) 15554 #endif 15555 15556 #ifdef __LITTLE_ENDIAN__ 15557 #define vld3q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 15558 int32x4x3_t __ret; \ 15559 int32x4x3_t __s1 = __p1; \ 15560 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 34); \ 15561 __ret; \ 15562 }) 15563 #else 15564 #define vld3q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 15565 int32x4x3_t __ret; \ 15566 int32x4x3_t __s1 = __p1; \ 15567 int32x4x3_t __rev1; \ 15568 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 15569 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 15570 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 15571 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 34); \ 15572 \ 15573 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15574 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15575 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15576 __ret; \ 15577 }) 15578 #endif 15579 
/*
 * vld3q_lane_s16, the vld3_lane_* family and the first vld4 / vld4q
 * intrinsic macros.
 *
 * Each macro is a statement expression that declares a result struct __ret,
 * lets the matching __builtin_neon_* builtin fill it through &__ret, and
 * yields __ret.  The _lane forms first copy __p1 into __s1 and pass its three
 * vectors, cast to int8x8_t / int8x16_t, together with __p2.  The big-endian
 * (#else) variants also reverse the lane order of every vector passed to or
 * received from the builtin, using __builtin_shufflevector.  The trailing
 * integer handed to the builtin differs per element type (presumably Clang's
 * NEON type selector -- confirm against the Clang sources).
 */

/* vld3q_lane_s16: int16x8x3_t __p1 and result, builtin code 33. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  int16x8x3_t __ret; \
  int16x8x3_t __s1 = __p1; \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 33); \
  __ret; \
})
#else
#define vld3q_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  int16x8x3_t __ret; \
  int16x8x3_t __s1 = __p1; \
  int16x8x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 33); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld3_lane_u8: uint8x8x3_t __p1 and result, builtin code 16. */
#ifdef __LITTLE_ENDIAN__
#define vld3_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  uint8x8x3_t __ret; \
  uint8x8x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 16); \
  __ret; \
})
#else
#define vld3_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  uint8x8x3_t __ret; \
  uint8x8x3_t __s1 = __p1; \
  uint8x8x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 16); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld3_lane_u32: uint32x2x3_t __p1 and result, builtin code 18. */
#ifdef __LITTLE_ENDIAN__
#define vld3_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  uint32x2x3_t __ret; \
  uint32x2x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 18); \
  __ret; \
})
#else
#define vld3_lane_u32(__p0, __p1, __p2) __extension__ ({ \
  uint32x2x3_t __ret; \
  uint32x2x3_t __s1 = __p1; \
  uint32x2x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 18); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3_lane_u16: uint16x4x3_t __p1 and result, builtin code 17. */
#ifdef __LITTLE_ENDIAN__
#define vld3_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  uint16x4x3_t __ret; \
  uint16x4x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 17); \
  __ret; \
})
#else
#define vld3_lane_u16(__p0, __p1, __p2) __extension__ ({ \
  uint16x4x3_t __ret; \
  uint16x4x3_t __s1 = __p1; \
  uint16x4x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 17); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld3_lane_s8: int8x8x3_t __p1 and result, builtin code 0. */
#ifdef __LITTLE_ENDIAN__
#define vld3_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  int8x8x3_t __ret; \
  int8x8x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 0); \
  __ret; \
})
#else
#define vld3_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  int8x8x3_t __ret; \
  int8x8x3_t __s1 = __p1; \
  int8x8x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 0); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld3_lane_f32: float32x2x3_t __p1 and result, builtin code 9. */
#ifdef __LITTLE_ENDIAN__
#define vld3_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  float32x2x3_t __ret; \
  float32x2x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 9); \
  __ret; \
})
#else
#define vld3_lane_f32(__p0, __p1, __p2) __extension__ ({ \
  float32x2x3_t __ret; \
  float32x2x3_t __s1 = __p1; \
  float32x2x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 9); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3_lane_s32: int32x2x3_t __p1 and result, builtin code 2. */
#ifdef __LITTLE_ENDIAN__
#define vld3_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  int32x2x3_t __ret; \
  int32x2x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 2); \
  __ret; \
})
#else
#define vld3_lane_s32(__p0, __p1, __p2) __extension__ ({ \
  int32x2x3_t __ret; \
  int32x2x3_t __s1 = __p1; \
  int32x2x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 2); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3_lane_s16: int16x4x3_t __p1 and result, builtin code 1. */
#ifdef __LITTLE_ENDIAN__
#define vld3_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  int16x4x3_t __ret; \
  int16x4x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 1); \
  __ret; \
})
#else
#define vld3_lane_s16(__p0, __p1, __p2) __extension__ ({ \
  int16x4x3_t __ret; \
  int16x4x3_t __s1 = __p1; \
  int16x4x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 1); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld4_p8: poly8x8x4_t result, builtin code 4. */
#ifdef __LITTLE_ENDIAN__
#define vld4_p8(__p0) __extension__ ({ \
  poly8x8x4_t __ret; \
  __builtin_neon_vld4_v(&__ret, __p0, 4); \
  __ret; \
})
#else
#define vld4_p8(__p0) __extension__ ({ \
  poly8x8x4_t __ret; \
  __builtin_neon_vld4_v(&__ret, __p0, 4); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld4_p16: poly16x4x4_t result, builtin code 5. */
#ifdef __LITTLE_ENDIAN__
#define vld4_p16(__p0) __extension__ ({ \
  poly16x4x4_t __ret; \
  __builtin_neon_vld4_v(&__ret, __p0, 5); \
  __ret; \
})
#else
#define vld4_p16(__p0) __extension__ ({ \
  poly16x4x4_t __ret; \
  __builtin_neon_vld4_v(&__ret, __p0, 5); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \
  __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld4q_p8: poly8x16x4_t result, builtin code 36. */
#ifdef __LITTLE_ENDIAN__
#define vld4q_p8(__p0) __extension__ ({ \
  poly8x16x4_t __ret; \
  __builtin_neon_vld4q_v(&__ret, __p0, 36); \
  __ret; \
})
#else
#define vld4q_p8(__p0) __extension__ ({ \
  poly8x16x4_t __ret; \
  __builtin_neon_vld4q_v(&__ret, __p0, 36); \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__ 15830 #define vld4q_p16(__p0) __extension__ ({ \ 15831 poly16x8x4_t __ret; \ 15832 __builtin_neon_vld4q_v(&__ret, __p0, 37); \ 15833 __ret; \ 15834 }) 15835 #else 15836 #define vld4q_p16(__p0) __extension__ ({ \ 15837 poly16x8x4_t __ret; \ 15838 __builtin_neon_vld4q_v(&__ret, __p0, 37); \ 15839 \ 15840 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15841 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15842 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15843 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 15844 __ret; \ 15845 }) 15846 #endif 15847 15848 #ifdef __LITTLE_ENDIAN__ 15849 #define vld4q_u8(__p0) __extension__ ({ \ 15850 uint8x16x4_t __ret; \ 15851 __builtin_neon_vld4q_v(&__ret, __p0, 48); \ 15852 __ret; \ 15853 }) 15854 #else 15855 #define vld4q_u8(__p0) __extension__ ({ \ 15856 uint8x16x4_t __ret; \ 15857 __builtin_neon_vld4q_v(&__ret, __p0, 48); \ 15858 \ 15859 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15860 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15861 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15862 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15863 __ret; \ 15864 }) 15865 #endif 15866 15867 #ifdef __LITTLE_ENDIAN__ 15868 #define vld4q_u32(__p0) __extension__ ({ \ 15869 uint32x4x4_t __ret; \ 15870 __builtin_neon_vld4q_v(&__ret, __p0, 50); \ 15871 __ret; \ 15872 }) 15873 #else 15874 #define vld4q_u32(__p0) __extension__ ({ \ 15875 uint32x4x4_t __ret; \ 15876 __builtin_neon_vld4q_v(&__ret, __p0, 50); \ 15877 \ 15878 
__ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15879 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15880 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15881 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 15882 __ret; \ 15883 }) 15884 #endif 15885 15886 #ifdef __LITTLE_ENDIAN__ 15887 #define vld4q_u16(__p0) __extension__ ({ \ 15888 uint16x8x4_t __ret; \ 15889 __builtin_neon_vld4q_v(&__ret, __p0, 49); \ 15890 __ret; \ 15891 }) 15892 #else 15893 #define vld4q_u16(__p0) __extension__ ({ \ 15894 uint16x8x4_t __ret; \ 15895 __builtin_neon_vld4q_v(&__ret, __p0, 49); \ 15896 \ 15897 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15898 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15899 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15900 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 15901 __ret; \ 15902 }) 15903 #endif 15904 15905 #ifdef __LITTLE_ENDIAN__ 15906 #define vld4q_s8(__p0) __extension__ ({ \ 15907 int8x16x4_t __ret; \ 15908 __builtin_neon_vld4q_v(&__ret, __p0, 32); \ 15909 __ret; \ 15910 }) 15911 #else 15912 #define vld4q_s8(__p0) __extension__ ({ \ 15913 int8x16x4_t __ret; \ 15914 __builtin_neon_vld4q_v(&__ret, __p0, 32); \ 15915 \ 15916 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15917 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15918 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 15919 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 
0); \ 15920 __ret; \ 15921 }) 15922 #endif 15923 15924 #ifdef __LITTLE_ENDIAN__ 15925 #define vld4q_f32(__p0) __extension__ ({ \ 15926 float32x4x4_t __ret; \ 15927 __builtin_neon_vld4q_v(&__ret, __p0, 41); \ 15928 __ret; \ 15929 }) 15930 #else 15931 #define vld4q_f32(__p0) __extension__ ({ \ 15932 float32x4x4_t __ret; \ 15933 __builtin_neon_vld4q_v(&__ret, __p0, 41); \ 15934 \ 15935 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15936 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15937 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15938 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 15939 __ret; \ 15940 }) 15941 #endif 15942 15943 #ifdef __LITTLE_ENDIAN__ 15944 #define vld4q_s32(__p0) __extension__ ({ \ 15945 int32x4x4_t __ret; \ 15946 __builtin_neon_vld4q_v(&__ret, __p0, 34); \ 15947 __ret; \ 15948 }) 15949 #else 15950 #define vld4q_s32(__p0) __extension__ ({ \ 15951 int32x4x4_t __ret; \ 15952 __builtin_neon_vld4q_v(&__ret, __p0, 34); \ 15953 \ 15954 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 15955 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 15956 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 15957 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 15958 __ret; \ 15959 }) 15960 #endif 15961 15962 #ifdef __LITTLE_ENDIAN__ 15963 #define vld4q_s16(__p0) __extension__ ({ \ 15964 int16x8x4_t __ret; \ 15965 __builtin_neon_vld4q_v(&__ret, __p0, 33); \ 15966 __ret; \ 15967 }) 15968 #else 15969 #define vld4q_s16(__p0) __extension__ ({ \ 15970 int16x8x4_t __ret; \ 15971 __builtin_neon_vld4q_v(&__ret, __p0, 33); \ 15972 \ 15973 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15974 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 
6, 5, 4, 3, 2, 1, 0); \ 15975 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15976 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 15977 __ret; \ 15978 }) 15979 #endif 15980 15981 /* vld4_u8(__p0): has __builtin_neon_vld4_v fill a uint8x8x4_t through &__ret from __p0 (trailing constant 16) and yields it; when __LITTLE_ENDIAN__ is not defined, each of the four result vectors is also element-reversed (7..0). */ #ifdef __LITTLE_ENDIAN__ 15982 #define vld4_u8(__p0) __extension__ ({ \ 15983 uint8x8x4_t __ret; \ 15984 __builtin_neon_vld4_v(&__ret, __p0, 16); \ 15985 __ret; \ 15986 }) 15987 #else 15988 #define vld4_u8(__p0) __extension__ ({ \ 15989 uint8x8x4_t __ret; \ 15990 __builtin_neon_vld4_v(&__ret, __p0, 16); \ 15991 \ 15992 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 15993 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 15994 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 15995 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 15996 __ret; \ 15997 }) 15998 #endif 15999 16000 /* vld4_u32(__p0): same shape with a uint32x2x4_t result and trailing constant 18; the #else variant swaps the two elements (1, 0) of each result vector. */ #ifdef __LITTLE_ENDIAN__ 16001 #define vld4_u32(__p0) __extension__ ({ \ 16002 uint32x2x4_t __ret; \ 16003 __builtin_neon_vld4_v(&__ret, __p0, 18); \ 16004 __ret; \ 16005 }) 16006 #else 16007 #define vld4_u32(__p0) __extension__ ({ \ 16008 uint32x2x4_t __ret; \ 16009 __builtin_neon_vld4_v(&__ret, __p0, 18); \ 16010 \ 16011 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16012 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16013 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16014 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16015 __ret; \ 16016 }) 16017 #endif 16018 16019 /* vld4_u64(__p0): defined once, outside any __LITTLE_ENDIAN__ conditional, with no shuffle after the builtin call (trailing constant 19). NOTE(review): presumably no reversal is needed because each uint64x1 vector holds a single element - confirm against arm_vector_types.h. */ #define vld4_u64(__p0) __extension__ ({ \ 16020 uint64x1x4_t __ret; \ 16021 __builtin_neon_vld4_v(&__ret, __p0, 19); \ 16022 __ret; \ 16023 }) 16024 #ifdef __LITTLE_ENDIAN__ 16025 #define vld4_u16(__p0) __extension__ ({ \ 16026 uint16x4x4_t __ret; \ 16027 
__builtin_neon_vld4_v(&__ret, __p0, 17); \ 16028 __ret; \ 16029 }) 16030 #else 16031 #define vld4_u16(__p0) __extension__ ({ \ 16032 uint16x4x4_t __ret; \ 16033 __builtin_neon_vld4_v(&__ret, __p0, 17); \ 16034 \ 16035 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16036 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16037 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16038 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16039 __ret; \ 16040 }) 16041 #endif 16042 16043 #ifdef __LITTLE_ENDIAN__ 16044 #define vld4_s8(__p0) __extension__ ({ \ 16045 int8x8x4_t __ret; \ 16046 __builtin_neon_vld4_v(&__ret, __p0, 0); \ 16047 __ret; \ 16048 }) 16049 #else 16050 #define vld4_s8(__p0) __extension__ ({ \ 16051 int8x8x4_t __ret; \ 16052 __builtin_neon_vld4_v(&__ret, __p0, 0); \ 16053 \ 16054 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16055 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16056 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16057 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16058 __ret; \ 16059 }) 16060 #endif 16061 16062 #ifdef __LITTLE_ENDIAN__ 16063 #define vld4_f32(__p0) __extension__ ({ \ 16064 float32x2x4_t __ret; \ 16065 __builtin_neon_vld4_v(&__ret, __p0, 9); \ 16066 __ret; \ 16067 }) 16068 #else 16069 #define vld4_f32(__p0) __extension__ ({ \ 16070 float32x2x4_t __ret; \ 16071 __builtin_neon_vld4_v(&__ret, __p0, 9); \ 16072 \ 16073 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16074 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16075 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16076 __ret.val[3] = __builtin_shufflevector(__ret.val[3], 
__ret.val[3], 1, 0); \ 16077 __ret; \ 16078 }) 16079 #endif 16080 16081 /* vld4_s32(__p0): has __builtin_neon_vld4_v fill an int32x2x4_t through &__ret from __p0 (trailing constant 2) and yields it; when __LITTLE_ENDIAN__ is not defined, the two elements of each of the four result vectors are swapped (1, 0). */ #ifdef __LITTLE_ENDIAN__ 16082 #define vld4_s32(__p0) __extension__ ({ \ 16083 int32x2x4_t __ret; \ 16084 __builtin_neon_vld4_v(&__ret, __p0, 2); \ 16085 __ret; \ 16086 }) 16087 #else 16088 #define vld4_s32(__p0) __extension__ ({ \ 16089 int32x2x4_t __ret; \ 16090 __builtin_neon_vld4_v(&__ret, __p0, 2); \ 16091 \ 16092 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16093 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16094 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16095 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16096 __ret; \ 16097 }) 16098 #endif 16099 16100 /* vld4_s64(__p0): defined once, outside any __LITTLE_ENDIAN__ conditional, with no shuffle after the builtin call (trailing constant 3). NOTE(review): presumably because each int64x1 vector holds a single element - confirm. */ #define vld4_s64(__p0) __extension__ ({ \ 16101 int64x1x4_t __ret; \ 16102 __builtin_neon_vld4_v(&__ret, __p0, 3); \ 16103 __ret; \ 16104 }) 16105 /* vld4_s16(__p0): int16x4x4_t result, trailing constant 1; the #else variant reverses each result vector with indices 3, 2, 1, 0. */ #ifdef __LITTLE_ENDIAN__ 16106 #define vld4_s16(__p0) __extension__ ({ \ 16107 int16x4x4_t __ret; \ 16108 __builtin_neon_vld4_v(&__ret, __p0, 1); \ 16109 __ret; \ 16110 }) 16111 #else 16112 #define vld4_s16(__p0) __extension__ ({ \ 16113 int16x4x4_t __ret; \ 16114 __builtin_neon_vld4_v(&__ret, __p0, 1); \ 16115 \ 16116 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16117 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16118 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16119 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16120 __ret; \ 16121 }) 16122 #endif 16123 16124 /* vld4_dup_p8(__p0): first of the vld4_dup macros; identical in shape to vld4_p8 except that it calls __builtin_neon_vld4_dup_v (trailing constant 4). The #else variant element-reverses each of the four poly8x8 result vectors after the call. */ #ifdef __LITTLE_ENDIAN__ 16125 #define vld4_dup_p8(__p0) __extension__ ({ \ 16126 poly8x8x4_t __ret; \ 16127 __builtin_neon_vld4_dup_v(&__ret, __p0, 4); \ 16128 __ret; \ 16129 }) 16130 #else 16131 #define vld4_dup_p8(__p0) __extension__ ({ \ 16132 poly8x8x4_t __ret; \ 16133 __builtin_neon_vld4_dup_v(&__ret, __p0, 4); \ 16134 \ 16135 __ret.val[0] = 
__builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16136 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16137 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16138 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16139 __ret; \ 16140 }) 16141 #endif 16142 16143 #ifdef __LITTLE_ENDIAN__ 16144 #define vld4_dup_p16(__p0) __extension__ ({ \ 16145 poly16x4x4_t __ret; \ 16146 __builtin_neon_vld4_dup_v(&__ret, __p0, 5); \ 16147 __ret; \ 16148 }) 16149 #else 16150 #define vld4_dup_p16(__p0) __extension__ ({ \ 16151 poly16x4x4_t __ret; \ 16152 __builtin_neon_vld4_dup_v(&__ret, __p0, 5); \ 16153 \ 16154 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16155 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16156 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16157 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16158 __ret; \ 16159 }) 16160 #endif 16161 16162 #ifdef __LITTLE_ENDIAN__ 16163 #define vld4q_dup_p8(__p0) __extension__ ({ \ 16164 poly8x16x4_t __ret; \ 16165 __builtin_neon_vld4q_dup_v(&__ret, __p0, 36); \ 16166 __ret; \ 16167 }) 16168 #else 16169 #define vld4q_dup_p8(__p0) __extension__ ({ \ 16170 poly8x16x4_t __ret; \ 16171 __builtin_neon_vld4q_dup_v(&__ret, __p0, 36); \ 16172 \ 16173 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16174 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16175 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16176 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 
5, 4, 3, 2, 1, 0); \ 16177 __ret; \ 16178 }) 16179 #endif 16180 16181 #ifdef __LITTLE_ENDIAN__ 16182 #define vld4q_dup_p16(__p0) __extension__ ({ \ 16183 poly16x8x4_t __ret; \ 16184 __builtin_neon_vld4q_dup_v(&__ret, __p0, 37); \ 16185 __ret; \ 16186 }) 16187 #else 16188 #define vld4q_dup_p16(__p0) __extension__ ({ \ 16189 poly16x8x4_t __ret; \ 16190 __builtin_neon_vld4q_dup_v(&__ret, __p0, 37); \ 16191 \ 16192 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16193 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16194 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16195 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16196 __ret; \ 16197 }) 16198 #endif 16199 16200 #ifdef __LITTLE_ENDIAN__ 16201 #define vld4q_dup_u8(__p0) __extension__ ({ \ 16202 uint8x16x4_t __ret; \ 16203 __builtin_neon_vld4q_dup_v(&__ret, __p0, 48); \ 16204 __ret; \ 16205 }) 16206 #else 16207 #define vld4q_dup_u8(__p0) __extension__ ({ \ 16208 uint8x16x4_t __ret; \ 16209 __builtin_neon_vld4q_dup_v(&__ret, __p0, 48); \ 16210 \ 16211 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16212 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16213 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16214 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16215 __ret; \ 16216 }) 16217 #endif 16218 16219 #ifdef __LITTLE_ENDIAN__ 16220 #define vld4q_dup_u32(__p0) __extension__ ({ \ 16221 uint32x4x4_t __ret; \ 16222 __builtin_neon_vld4q_dup_v(&__ret, __p0, 50); \ 16223 __ret; \ 16224 }) 16225 #else 16226 #define vld4q_dup_u32(__p0) 
__extension__ ({ \ 16227 uint32x4x4_t __ret; \ 16228 __builtin_neon_vld4q_dup_v(&__ret, __p0, 50); \ 16229 \ 16230 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16231 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16232 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16233 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16234 __ret; \ 16235 }) 16236 #endif 16237 16238 /* vld4q_dup_u64(__p0): has __builtin_neon_vld4q_dup_v fill a uint64x2x4_t through &__ret from __p0 (trailing constant 51) and yields it. Unlike the unconditional vld4_u64 / vld4_dup_u64 macros, this 64-bit form does have a separate #else variant, which swaps the two elements (1, 0) of each result vector. */ #ifdef __LITTLE_ENDIAN__ 16239 #define vld4q_dup_u64(__p0) __extension__ ({ \ 16240 uint64x2x4_t __ret; \ 16241 __builtin_neon_vld4q_dup_v(&__ret, __p0, 51); \ 16242 __ret; \ 16243 }) 16244 #else 16245 #define vld4q_dup_u64(__p0) __extension__ ({ \ 16246 uint64x2x4_t __ret; \ 16247 __builtin_neon_vld4q_dup_v(&__ret, __p0, 51); \ 16248 \ 16249 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16250 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16251 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16252 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16253 __ret; \ 16254 }) 16255 #endif 16256 16257 /* vld4q_dup_u16(__p0): uint16x8x4_t result, trailing constant 49; the #else variant reverses each result vector with indices 7..0. */ #ifdef __LITTLE_ENDIAN__ 16258 #define vld4q_dup_u16(__p0) __extension__ ({ \ 16259 uint16x8x4_t __ret; \ 16260 __builtin_neon_vld4q_dup_v(&__ret, __p0, 49); \ 16261 __ret; \ 16262 }) 16263 #else 16264 #define vld4q_dup_u16(__p0) __extension__ ({ \ 16265 uint16x8x4_t __ret; \ 16266 __builtin_neon_vld4q_dup_v(&__ret, __p0, 49); \ 16267 \ 16268 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16269 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16270 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16271 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16272 __ret; \ 16273 }) 16274 
#endif 16275 16276 #ifdef __LITTLE_ENDIAN__ 16277 #define vld4q_dup_s8(__p0) __extension__ ({ \ 16278 int8x16x4_t __ret; \ 16279 __builtin_neon_vld4q_dup_v(&__ret, __p0, 32); \ 16280 __ret; \ 16281 }) 16282 #else 16283 #define vld4q_dup_s8(__p0) __extension__ ({ \ 16284 int8x16x4_t __ret; \ 16285 __builtin_neon_vld4q_dup_v(&__ret, __p0, 32); \ 16286 \ 16287 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16288 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16289 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16290 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 16291 __ret; \ 16292 }) 16293 #endif 16294 16295 #ifdef __LITTLE_ENDIAN__ 16296 #define vld4q_dup_f32(__p0) __extension__ ({ \ 16297 float32x4x4_t __ret; \ 16298 __builtin_neon_vld4q_dup_v(&__ret, __p0, 41); \ 16299 __ret; \ 16300 }) 16301 #else 16302 #define vld4q_dup_f32(__p0) __extension__ ({ \ 16303 float32x4x4_t __ret; \ 16304 __builtin_neon_vld4q_dup_v(&__ret, __p0, 41); \ 16305 \ 16306 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16307 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16308 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16309 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16310 __ret; \ 16311 }) 16312 #endif 16313 16314 #ifdef __LITTLE_ENDIAN__ 16315 #define vld4q_dup_s32(__p0) __extension__ ({ \ 16316 int32x4x4_t __ret; \ 16317 __builtin_neon_vld4q_dup_v(&__ret, __p0, 34); \ 16318 __ret; \ 16319 }) 16320 #else 16321 #define vld4q_dup_s32(__p0) __extension__ ({ \ 16322 int32x4x4_t __ret; \ 16323 __builtin_neon_vld4q_dup_v(&__ret, __p0, 34); \ 16324 
\ 16325 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16326 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16327 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16328 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16329 __ret; \ 16330 }) 16331 #endif 16332 16333 #ifdef __LITTLE_ENDIAN__ 16334 #define vld4q_dup_s64(__p0) __extension__ ({ \ 16335 int64x2x4_t __ret; \ 16336 __builtin_neon_vld4q_dup_v(&__ret, __p0, 35); \ 16337 __ret; \ 16338 }) 16339 #else 16340 #define vld4q_dup_s64(__p0) __extension__ ({ \ 16341 int64x2x4_t __ret; \ 16342 __builtin_neon_vld4q_dup_v(&__ret, __p0, 35); \ 16343 \ 16344 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16345 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16346 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16347 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16348 __ret; \ 16349 }) 16350 #endif 16351 16352 #ifdef __LITTLE_ENDIAN__ 16353 #define vld4q_dup_s16(__p0) __extension__ ({ \ 16354 int16x8x4_t __ret; \ 16355 __builtin_neon_vld4q_dup_v(&__ret, __p0, 33); \ 16356 __ret; \ 16357 }) 16358 #else 16359 #define vld4q_dup_s16(__p0) __extension__ ({ \ 16360 int16x8x4_t __ret; \ 16361 __builtin_neon_vld4q_dup_v(&__ret, __p0, 33); \ 16362 \ 16363 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16364 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16365 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16366 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16367 __ret; \ 16368 }) 16369 #endif 16370 16371 #ifdef __LITTLE_ENDIAN__ 16372 #define vld4_dup_u8(__p0) __extension__ ({ \ 16373 uint8x8x4_t 
__ret; \ 16374 __builtin_neon_vld4_dup_v(&__ret, __p0, 16); \ 16375 __ret; \ 16376 }) 16377 #else 16378 #define vld4_dup_u8(__p0) __extension__ ({ \ 16379 uint8x8x4_t __ret; \ 16380 __builtin_neon_vld4_dup_v(&__ret, __p0, 16); \ 16381 \ 16382 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16383 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16384 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16385 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16386 __ret; \ 16387 }) 16388 #endif 16389 16390 /* vld4_dup_u32(__p0): has __builtin_neon_vld4_dup_v fill a uint32x2x4_t through &__ret from __p0 (trailing constant 18) and yields it; when __LITTLE_ENDIAN__ is not defined, the two elements of each of the four result vectors are swapped (1, 0). */ #ifdef __LITTLE_ENDIAN__ 16391 #define vld4_dup_u32(__p0) __extension__ ({ \ 16392 uint32x2x4_t __ret; \ 16393 __builtin_neon_vld4_dup_v(&__ret, __p0, 18); \ 16394 __ret; \ 16395 }) 16396 #else 16397 #define vld4_dup_u32(__p0) __extension__ ({ \ 16398 uint32x2x4_t __ret; \ 16399 __builtin_neon_vld4_dup_v(&__ret, __p0, 18); \ 16400 \ 16401 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16402 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16403 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16404 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16405 __ret; \ 16406 }) 16407 #endif 16408 16409 /* vld4_dup_u64(__p0): defined once, outside any __LITTLE_ENDIAN__ conditional, with no shuffle after the builtin call (trailing constant 19). NOTE(review): presumably because each uint64x1 vector holds a single element - confirm. */ #define vld4_dup_u64(__p0) __extension__ ({ \ 16410 uint64x1x4_t __ret; \ 16411 __builtin_neon_vld4_dup_v(&__ret, __p0, 19); \ 16412 __ret; \ 16413 }) 16414 #ifdef __LITTLE_ENDIAN__ 16415 #define vld4_dup_u16(__p0) __extension__ ({ \ 16416 uint16x4x4_t __ret; \ 16417 __builtin_neon_vld4_dup_v(&__ret, __p0, 17); \ 16418 __ret; \ 16419 }) 16420 #else 16421 #define vld4_dup_u16(__p0) __extension__ ({ \ 16422 uint16x4x4_t __ret; \ 16423 __builtin_neon_vld4_dup_v(&__ret, __p0, 17); \ 16424 \ 16425 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16426 __ret.val[1] = 
__builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16427 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16428 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16429 __ret; \ 16430 }) 16431 #endif 16432 16433 #ifdef __LITTLE_ENDIAN__ 16434 #define vld4_dup_s8(__p0) __extension__ ({ \ 16435 int8x8x4_t __ret; \ 16436 __builtin_neon_vld4_dup_v(&__ret, __p0, 0); \ 16437 __ret; \ 16438 }) 16439 #else 16440 #define vld4_dup_s8(__p0) __extension__ ({ \ 16441 int8x8x4_t __ret; \ 16442 __builtin_neon_vld4_dup_v(&__ret, __p0, 0); \ 16443 \ 16444 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16445 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16446 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16447 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16448 __ret; \ 16449 }) 16450 #endif 16451 16452 #ifdef __LITTLE_ENDIAN__ 16453 #define vld4_dup_f32(__p0) __extension__ ({ \ 16454 float32x2x4_t __ret; \ 16455 __builtin_neon_vld4_dup_v(&__ret, __p0, 9); \ 16456 __ret; \ 16457 }) 16458 #else 16459 #define vld4_dup_f32(__p0) __extension__ ({ \ 16460 float32x2x4_t __ret; \ 16461 __builtin_neon_vld4_dup_v(&__ret, __p0, 9); \ 16462 \ 16463 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16464 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16465 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16466 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16467 __ret; \ 16468 }) 16469 #endif 16470 16471 #ifdef __LITTLE_ENDIAN__ 16472 #define vld4_dup_s32(__p0) __extension__ ({ \ 16473 int32x2x4_t __ret; \ 16474 __builtin_neon_vld4_dup_v(&__ret, __p0, 2); \ 16475 __ret; \ 16476 }) 16477 #else 16478 #define 
vld4_dup_s32(__p0) __extension__ ({ \ 16479 int32x2x4_t __ret; \ 16480 __builtin_neon_vld4_dup_v(&__ret, __p0, 2); \ 16481 \ 16482 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16483 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16484 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16485 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16486 __ret; \ 16487 }) 16488 #endif 16489 16490 /* vld4_dup_s64(__p0): defined once, outside any __LITTLE_ENDIAN__ conditional, with no shuffle after the builtin call (trailing constant 3). NOTE(review): presumably because each int64x1 vector holds a single element - confirm. */ #define vld4_dup_s64(__p0) __extension__ ({ \ 16491 int64x1x4_t __ret; \ 16492 __builtin_neon_vld4_dup_v(&__ret, __p0, 3); \ 16493 __ret; \ 16494 }) 16495 /* vld4_dup_s16(__p0): has __builtin_neon_vld4_dup_v fill an int16x4x4_t through &__ret from __p0 (trailing constant 1) and yields it; the #else variant reverses each of the four result vectors with indices 3, 2, 1, 0. */ #ifdef __LITTLE_ENDIAN__ 16496 #define vld4_dup_s16(__p0) __extension__ ({ \ 16497 int16x4x4_t __ret; \ 16498 __builtin_neon_vld4_dup_v(&__ret, __p0, 1); \ 16499 __ret; \ 16500 }) 16501 #else 16502 #define vld4_dup_s16(__p0) __extension__ ({ \ 16503 int16x4x4_t __ret; \ 16504 __builtin_neon_vld4_dup_v(&__ret, __p0, 1); \ 16505 \ 16506 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16507 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16508 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16509 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16510 __ret; \ 16511 }) 16512 #endif 16513 16514 /* vld4_lane_p8(__p0, __p1, __p2): first of the vld4_lane macros. Copies __p1 into __s1 and passes its four member vectors (each cast to int8x8_t), together with __p0 and __p2, to __builtin_neon_vld4_lane_v, which writes the poly8x8x4_t result through &__ret (trailing constant 4). When __LITTLE_ENDIAN__ is not defined, the four inputs are first element-reversed (7..0) into __rev1, the builtin is called on __rev1, and the four result vectors are element-reversed again before being yielded. */ #ifdef __LITTLE_ENDIAN__ 16515 #define vld4_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 16516 poly8x8x4_t __ret; \ 16517 poly8x8x4_t __s1 = __p1; \ 16518 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 4); \ 16519 __ret; \ 16520 }) 16521 #else 16522 #define vld4_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 16523 poly8x8x4_t __ret; \ 16524 poly8x8x4_t __s1 = __p1; \ 16525 poly8x8x4_t __rev1; \ 16526 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16527 __rev1.val[1] = 
__builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16528 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16529 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16530 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 4); \ 16531 \ 16532 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16533 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16534 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16535 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16536 __ret; \ 16537 }) 16538 #endif 16539 16540 #ifdef __LITTLE_ENDIAN__ 16541 #define vld4_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 16542 poly16x4x4_t __ret; \ 16543 poly16x4x4_t __s1 = __p1; \ 16544 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 5); \ 16545 __ret; \ 16546 }) 16547 #else 16548 #define vld4_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 16549 poly16x4x4_t __ret; \ 16550 poly16x4x4_t __s1 = __p1; \ 16551 poly16x4x4_t __rev1; \ 16552 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 16553 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 16554 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 16555 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 16556 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 5); \ 16557 \ 16558 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16559 
__ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16560 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16561 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16562 __ret; \ 16563 }) 16564 #endif 16565 16566 /* vld4q_lane_p16(__p0, __p1, __p2): copies __p1 into __s1 and passes its four member vectors (each cast to int8x16_t), together with __p0 and __p2, to __builtin_neon_vld4q_lane_v, which writes the poly16x8x4_t result through &__ret (trailing constant 37). When __LITTLE_ENDIAN__ is not defined, the four inputs are first element-reversed (7..0) into __rev1, the builtin is called on __rev1, and the four result vectors are element-reversed again before being yielded. */ #ifdef __LITTLE_ENDIAN__ 16567 #define vld4q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 16568 poly16x8x4_t __ret; \ 16569 poly16x8x4_t __s1 = __p1; \ 16570 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 37); \ 16571 __ret; \ 16572 }) 16573 #else 16574 #define vld4q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 16575 poly16x8x4_t __ret; \ 16576 poly16x8x4_t __s1 = __p1; \ 16577 poly16x8x4_t __rev1; \ 16578 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16579 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16580 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16581 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16582 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 37); \ 16583 \ 16584 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16585 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16586 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16587 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16588 __ret; \ 16589 }) 16590 #endif 16591 16592 #ifdef __LITTLE_ENDIAN__ 16593 #define vld4q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 16594 uint32x4x4_t __ret; \ 16595 uint32x4x4_t __s1 = __p1; \ 16596 
__builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 50); \ 16597 __ret; \ 16598 }) 16599 #else 16600 #define vld4q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 16601 uint32x4x4_t __ret; \ 16602 uint32x4x4_t __s1 = __p1; \ 16603 uint32x4x4_t __rev1; \ 16604 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 16605 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 16606 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 16607 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 16608 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 50); \ 16609 \ 16610 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16611 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16612 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16613 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16614 __ret; \ 16615 }) 16616 #endif 16617 16618 #ifdef __LITTLE_ENDIAN__ 16619 #define vld4q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 16620 uint16x8x4_t __ret; \ 16621 uint16x8x4_t __s1 = __p1; \ 16622 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 49); \ 16623 __ret; \ 16624 }) 16625 #else 16626 #define vld4q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 16627 uint16x8x4_t __ret; \ 16628 uint16x8x4_t __s1 = __p1; \ 16629 uint16x8x4_t __rev1; \ 16630 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16631 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16632 __rev1.val[2] = 
__builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16633 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16634 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 49); \ 16635 \ 16636 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16637 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16638 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16639 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16640 __ret; \ 16641 }) 16642 #endif 16643 16644 #ifdef __LITTLE_ENDIAN__ 16645 #define vld4q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 16646 float32x4x4_t __ret; \ 16647 float32x4x4_t __s1 = __p1; \ 16648 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 41); \ 16649 __ret; \ 16650 }) 16651 #else 16652 #define vld4q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 16653 float32x4x4_t __ret; \ 16654 float32x4x4_t __s1 = __p1; \ 16655 float32x4x4_t __rev1; \ 16656 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 16657 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 16658 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 16659 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 16660 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 41); \ 16661 \ 16662 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16663 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 
0); \ 16664 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16665 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16666 __ret; \ 16667 }) 16668 #endif 16669 16670 #ifdef __LITTLE_ENDIAN__ 16671 #define vld4q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 16672 int32x4x4_t __ret; \ 16673 int32x4x4_t __s1 = __p1; \ 16674 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 34); \ 16675 __ret; \ 16676 }) 16677 #else 16678 #define vld4q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 16679 int32x4x4_t __ret; \ 16680 int32x4x4_t __s1 = __p1; \ 16681 int32x4x4_t __rev1; \ 16682 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 16683 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 16684 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 16685 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 16686 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 34); \ 16687 \ 16688 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16689 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16690 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16691 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16692 __ret; \ 16693 }) 16694 #endif 16695 16696 #ifdef __LITTLE_ENDIAN__ 16697 #define vld4q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 16698 int16x8x4_t __ret; \ 16699 int16x8x4_t __s1 = __p1; \ 16700 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 33); \ 16701 __ret; \ 16702 }) 16703 #else 
16704 #define vld4q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 16705 int16x8x4_t __ret; \ 16706 int16x8x4_t __s1 = __p1; \ 16707 int16x8x4_t __rev1; \ 16708 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16709 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16710 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16711 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16712 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 33); \ 16713 \ 16714 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16715 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16716 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16717 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16718 __ret; \ 16719 }) 16720 #endif 16721 16722 #ifdef __LITTLE_ENDIAN__ 16723 #define vld4_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 16724 uint8x8x4_t __ret; \ 16725 uint8x8x4_t __s1 = __p1; \ 16726 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 16); \ 16727 __ret; \ 16728 }) 16729 #else 16730 #define vld4_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 16731 uint8x8x4_t __ret; \ 16732 uint8x8x4_t __s1 = __p1; \ 16733 uint8x8x4_t __rev1; \ 16734 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16735 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16736 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16737 __rev1.val[3] = 
__builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16738 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 16); \ 16739 \ 16740 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16741 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16742 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16743 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16744 __ret; \ 16745 }) 16746 #endif 16747 16748 #ifdef __LITTLE_ENDIAN__ 16749 #define vld4_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 16750 uint32x2x4_t __ret; \ 16751 uint32x2x4_t __s1 = __p1; \ 16752 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 18); \ 16753 __ret; \ 16754 }) 16755 #else 16756 #define vld4_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 16757 uint32x2x4_t __ret; \ 16758 uint32x2x4_t __s1 = __p1; \ 16759 uint32x2x4_t __rev1; \ 16760 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 16761 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 16762 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 16763 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 16764 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 18); \ 16765 \ 16766 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16767 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16768 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16769 __ret.val[3] = __builtin_shufflevector(__ret.val[3], 
__ret.val[3], 1, 0); \ 16770 __ret; \ 16771 }) 16772 #endif 16773 16774 #ifdef __LITTLE_ENDIAN__ 16775 #define vld4_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 16776 uint16x4x4_t __ret; \ 16777 uint16x4x4_t __s1 = __p1; \ 16778 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 17); \ 16779 __ret; \ 16780 }) 16781 #else 16782 #define vld4_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 16783 uint16x4x4_t __ret; \ 16784 uint16x4x4_t __s1 = __p1; \ 16785 uint16x4x4_t __rev1; \ 16786 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 16787 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 16788 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 16789 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 16790 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 17); \ 16791 \ 16792 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16793 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16794 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16795 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16796 __ret; \ 16797 }) 16798 #endif 16799 16800 #ifdef __LITTLE_ENDIAN__ 16801 #define vld4_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 16802 int8x8x4_t __ret; \ 16803 int8x8x4_t __s1 = __p1; \ 16804 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 0); \ 16805 __ret; \ 16806 }) 16807 #else 16808 #define vld4_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 16809 int8x8x4_t __ret; \ 16810 int8x8x4_t __s1 = __p1; \ 16811 int8x8x4_t __rev1; \ 16812 __rev1.val[0] = 
__builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16813 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16814 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16815 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16816 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 0); \ 16817 \ 16818 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 16819 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 16820 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 16821 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 16822 __ret; \ 16823 }) 16824 #endif 16825 16826 #ifdef __LITTLE_ENDIAN__ 16827 #define vld4_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 16828 float32x2x4_t __ret; \ 16829 float32x2x4_t __s1 = __p1; \ 16830 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 9); \ 16831 __ret; \ 16832 }) 16833 #else 16834 #define vld4_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 16835 float32x2x4_t __ret; \ 16836 float32x2x4_t __s1 = __p1; \ 16837 float32x2x4_t __rev1; \ 16838 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 16839 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 16840 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 16841 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 16842 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 9); \ 16843 \ 16844 __ret.val[0] 
= __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16845 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16846 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16847 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16848 __ret; \ 16849 }) 16850 #endif 16851 16852 #ifdef __LITTLE_ENDIAN__ 16853 #define vld4_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 16854 int32x2x4_t __ret; \ 16855 int32x2x4_t __s1 = __p1; \ 16856 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 2); \ 16857 __ret; \ 16858 }) 16859 #else 16860 #define vld4_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 16861 int32x2x4_t __ret; \ 16862 int32x2x4_t __s1 = __p1; \ 16863 int32x2x4_t __rev1; \ 16864 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 16865 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 16866 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 16867 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 16868 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 2); \ 16869 \ 16870 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 16871 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 16872 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 16873 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 16874 __ret; \ 16875 }) 16876 #endif 16877 16878 #ifdef __LITTLE_ENDIAN__ 16879 #define vld4_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 16880 int16x4x4_t __ret; \ 16881 int16x4x4_t __s1 = __p1; \ 16882 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 
(int8x8_t)__s1.val[3], __p2, 1); \ 16883 __ret; \ 16884 }) 16885 #else 16886 #define vld4_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 16887 int16x4x4_t __ret; \ 16888 int16x4x4_t __s1 = __p1; \ 16889 int16x4x4_t __rev1; \ 16890 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 16891 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 16892 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 16893 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 16894 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 1); \ 16895 \ 16896 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 16897 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 16898 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 16899 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 16900 __ret; \ 16901 }) 16902 #endif 16903 16904 #ifdef __LITTLE_ENDIAN__ 16905 __ai __attribute__((target("neon"))) uint8x16_t vmaxq_u8(uint8x16_t __p0, uint8x16_t __p1) { 16906 uint8x16_t __ret; 16907 __ret = (uint8x16_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 16908 return __ret; 16909 } 16910 #else 16911 __ai __attribute__((target("neon"))) uint8x16_t vmaxq_u8(uint8x16_t __p0, uint8x16_t __p1) { 16912 uint8x16_t __ret; 16913 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 16914 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 16915 __ret = (uint8x16_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 16916 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 16917 
return __ret; 16918 } 16919 #endif 16920 16921 #ifdef __LITTLE_ENDIAN__ 16922 __ai __attribute__((target("neon"))) uint32x4_t vmaxq_u32(uint32x4_t __p0, uint32x4_t __p1) { 16923 uint32x4_t __ret; 16924 __ret = (uint32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 16925 return __ret; 16926 } 16927 #else 16928 __ai __attribute__((target("neon"))) uint32x4_t vmaxq_u32(uint32x4_t __p0, uint32x4_t __p1) { 16929 uint32x4_t __ret; 16930 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 16931 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 16932 __ret = (uint32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 16933 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 16934 return __ret; 16935 } 16936 #endif 16937 16938 #ifdef __LITTLE_ENDIAN__ 16939 __ai __attribute__((target("neon"))) uint16x8_t vmaxq_u16(uint16x8_t __p0, uint16x8_t __p1) { 16940 uint16x8_t __ret; 16941 __ret = (uint16x8_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 16942 return __ret; 16943 } 16944 #else 16945 __ai __attribute__((target("neon"))) uint16x8_t vmaxq_u16(uint16x8_t __p0, uint16x8_t __p1) { 16946 uint16x8_t __ret; 16947 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 16948 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 16949 __ret = (uint16x8_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 16950 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 16951 return __ret; 16952 } 16953 #endif 16954 16955 #ifdef __LITTLE_ENDIAN__ 16956 __ai __attribute__((target("neon"))) int8x16_t vmaxq_s8(int8x16_t __p0, int8x16_t __p1) { 16957 int8x16_t __ret; 16958 __ret = (int8x16_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 16959 return __ret; 16960 } 16961 #else 16962 __ai __attribute__((target("neon"))) int8x16_t vmaxq_s8(int8x16_t __p0, 
int8x16_t __p1) { 16963 int8x16_t __ret; 16964 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 16965 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 16966 __ret = (int8x16_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 16967 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 16968 return __ret; 16969 } 16970 #endif 16971 16972 #ifdef __LITTLE_ENDIAN__ 16973 __ai __attribute__((target("neon"))) float32x4_t vmaxq_f32(float32x4_t __p0, float32x4_t __p1) { 16974 float32x4_t __ret; 16975 __ret = (float32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 16976 return __ret; 16977 } 16978 #else 16979 __ai __attribute__((target("neon"))) float32x4_t vmaxq_f32(float32x4_t __p0, float32x4_t __p1) { 16980 float32x4_t __ret; 16981 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 16982 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 16983 __ret = (float32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 16984 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 16985 return __ret; 16986 } 16987 #endif 16988 16989 #ifdef __LITTLE_ENDIAN__ 16990 __ai __attribute__((target("neon"))) int32x4_t vmaxq_s32(int32x4_t __p0, int32x4_t __p1) { 16991 int32x4_t __ret; 16992 __ret = (int32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 16993 return __ret; 16994 } 16995 #else 16996 __ai __attribute__((target("neon"))) int32x4_t vmaxq_s32(int32x4_t __p0, int32x4_t __p1) { 16997 int32x4_t __ret; 16998 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 16999 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17000 __ret = (int32x4_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 17001 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17002 return __ret; 17003 } 17004 #endif 17005 17006 #ifdef __LITTLE_ENDIAN__ 17007 __ai __attribute__((target("neon"))) int16x8_t vmaxq_s16(int16x8_t __p0, int16x8_t __p1) { 17008 int16x8_t __ret; 17009 __ret = (int16x8_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 17010 return __ret; 17011 } 17012 #else 17013 __ai __attribute__((target("neon"))) int16x8_t vmaxq_s16(int16x8_t __p0, int16x8_t __p1) { 17014 int16x8_t __ret; 17015 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17016 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17017 __ret = (int16x8_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 17018 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17019 return __ret; 17020 } 17021 #endif 17022 17023 #ifdef __LITTLE_ENDIAN__ 17024 __ai __attribute__((target("neon"))) uint8x8_t vmax_u8(uint8x8_t __p0, uint8x8_t __p1) { 17025 uint8x8_t __ret; 17026 __ret = (uint8x8_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 17027 return __ret; 17028 } 17029 #else 17030 __ai __attribute__((target("neon"))) uint8x8_t vmax_u8(uint8x8_t __p0, uint8x8_t __p1) { 17031 uint8x8_t __ret; 17032 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17033 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17034 __ret = (uint8x8_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 17035 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17036 return __ret; 17037 } 17038 #endif 17039 17040 #ifdef __LITTLE_ENDIAN__ 17041 __ai __attribute__((target("neon"))) uint32x2_t vmax_u32(uint32x2_t __p0, uint32x2_t __p1) { 17042 uint32x2_t __ret; 17043 __ret = (uint32x2_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 17044 return __ret; 17045 } 17046 #else 17047 __ai 
__attribute__((target("neon"))) uint32x2_t vmax_u32(uint32x2_t __p0, uint32x2_t __p1) { 17048 uint32x2_t __ret; 17049 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17050 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17051 __ret = (uint32x2_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 17052 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17053 return __ret; 17054 } 17055 #endif 17056 17057 #ifdef __LITTLE_ENDIAN__ 17058 __ai __attribute__((target("neon"))) uint16x4_t vmax_u16(uint16x4_t __p0, uint16x4_t __p1) { 17059 uint16x4_t __ret; 17060 __ret = (uint16x4_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 17061 return __ret; 17062 } 17063 #else 17064 __ai __attribute__((target("neon"))) uint16x4_t vmax_u16(uint16x4_t __p0, uint16x4_t __p1) { 17065 uint16x4_t __ret; 17066 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17067 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17068 __ret = (uint16x4_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 17069 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17070 return __ret; 17071 } 17072 #endif 17073 17074 #ifdef __LITTLE_ENDIAN__ 17075 __ai __attribute__((target("neon"))) int8x8_t vmax_s8(int8x8_t __p0, int8x8_t __p1) { 17076 int8x8_t __ret; 17077 __ret = (int8x8_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 17078 return __ret; 17079 } 17080 #else 17081 __ai __attribute__((target("neon"))) int8x8_t vmax_s8(int8x8_t __p0, int8x8_t __p1) { 17082 int8x8_t __ret; 17083 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17084 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17085 __ret = (int8x8_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 17086 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17087 return __ret; 17088 } 17089 
#endif 17090 /* vmax_f32: casts both float32x2_t operands to int8x8_t, calls __builtin_neon_vmax_v with trailing constant 9 (presumably the builtin's element-type selector; confirm against the builtin definition) and casts the result back. The #else variant swaps the 2 lanes of each operand before the call and of the result after it. */ 17091 #ifdef __LITTLE_ENDIAN__ 17092 __ai __attribute__((target("neon"))) float32x2_t vmax_f32(float32x2_t __p0, float32x2_t __p1) { 17093 float32x2_t __ret; 17094 __ret = (float32x2_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 17095 return __ret; 17096 } 17097 #else 17098 __ai __attribute__((target("neon"))) float32x2_t vmax_f32(float32x2_t __p0, float32x2_t __p1) { 17099 float32x2_t __ret; 17100 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17101 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17102 __ret = (float32x2_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 17103 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17104 return __ret; 17105 } 17106 #endif 17107 /* vmax_s32: __builtin_neon_vmax_v on int32x2_t operands with trailing constant 2; the #else variant swaps 2 lanes around the call. */ 17108 #ifdef __LITTLE_ENDIAN__ 17109 __ai __attribute__((target("neon"))) int32x2_t vmax_s32(int32x2_t __p0, int32x2_t __p1) { 17110 int32x2_t __ret; 17111 __ret = (int32x2_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 17112 return __ret; 17113 } 17114 #else 17115 __ai __attribute__((target("neon"))) int32x2_t vmax_s32(int32x2_t __p0, int32x2_t __p1) { 17116 int32x2_t __ret; 17117 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17118 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17119 __ret = (int32x2_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 17120 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17121 return __ret; 17122 } 17123 #endif 17124 /* vmax_s16: __builtin_neon_vmax_v on int16x4_t operands with trailing constant 1; the #else variant reverses 4 lanes around the call. */ 17125 #ifdef __LITTLE_ENDIAN__ 17126 __ai __attribute__((target("neon"))) int16x4_t vmax_s16(int16x4_t __p0, int16x4_t __p1) { 17127 int16x4_t __ret; 17128 __ret = (int16x4_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 17129 return __ret; 17130 } 17131 #else 17132 __ai __attribute__((target("neon"))) int16x4_t vmax_s16(int16x4_t __p0, int16x4_t __p1) { 17133 int16x4_t __ret; 17134 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17135 
int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17136 __ret = (int16x4_t) __builtin_neon_vmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 17137 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17138 return __ret; 17139 } 17140 #endif 17141 /* vminq_u8: casts both uint8x16_t operands to int8x16_t, calls __builtin_neon_vminq_v with trailing constant 48 and casts the result back; the #else variant reverses the 16 lanes of each operand before the call and of the result after it. */ 17142 #ifdef __LITTLE_ENDIAN__ 17143 __ai __attribute__((target("neon"))) uint8x16_t vminq_u8(uint8x16_t __p0, uint8x16_t __p1) { 17144 uint8x16_t __ret; 17145 __ret = (uint8x16_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 17146 return __ret; 17147 } 17148 #else 17149 __ai __attribute__((target("neon"))) uint8x16_t vminq_u8(uint8x16_t __p0, uint8x16_t __p1) { 17150 uint8x16_t __ret; 17151 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17152 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17153 __ret = (uint8x16_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 17154 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17155 return __ret; 17156 } 17157 #endif 17158 /* vminq_u32: __builtin_neon_vminq_v on uint32x4_t operands with trailing constant 50; the #else variant reverses 4 lanes around the call. */ 17159 #ifdef __LITTLE_ENDIAN__ 17160 __ai __attribute__((target("neon"))) uint32x4_t vminq_u32(uint32x4_t __p0, uint32x4_t __p1) { 17161 uint32x4_t __ret; 17162 __ret = (uint32x4_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 17163 return __ret; 17164 } 17165 #else 17166 __ai __attribute__((target("neon"))) uint32x4_t vminq_u32(uint32x4_t __p0, uint32x4_t __p1) { 17167 uint32x4_t __ret; 17168 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17169 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17170 __ret = (uint32x4_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 17171 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17172 return __ret; 17173 } 17174 #endif 17175 /* vminq_u16: __builtin_neon_vminq_v on uint16x8_t operands with trailing constant 49; the #else variant reverses 8 lanes around the call. */ 17176 #ifdef __LITTLE_ENDIAN__ 17177 __ai 
__attribute__((target("neon"))) uint16x8_t vminq_u16(uint16x8_t __p0, uint16x8_t __p1) { 17178 uint16x8_t __ret; 17179 __ret = (uint16x8_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 17180 return __ret; 17181 } 17182 #else 17183 __ai __attribute__((target("neon"))) uint16x8_t vminq_u16(uint16x8_t __p0, uint16x8_t __p1) { 17184 uint16x8_t __ret; 17185 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17186 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17187 __ret = (uint16x8_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 17188 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17189 return __ret; 17190 } 17191 #endif 17192 /* vminq_s8: __builtin_neon_vminq_v on int8x16_t operands with trailing constant 32; the #else variant reverses 16 lanes around the call. */ 17193 #ifdef __LITTLE_ENDIAN__ 17194 __ai __attribute__((target("neon"))) int8x16_t vminq_s8(int8x16_t __p0, int8x16_t __p1) { 17195 int8x16_t __ret; 17196 __ret = (int8x16_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 17197 return __ret; 17198 } 17199 #else 17200 __ai __attribute__((target("neon"))) int8x16_t vminq_s8(int8x16_t __p0, int8x16_t __p1) { 17201 int8x16_t __ret; 17202 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17203 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17204 __ret = (int8x16_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 17205 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17206 return __ret; 17207 } 17208 #endif 17209 /* vminq_f32: __builtin_neon_vminq_v on float32x4_t operands with trailing constant 41; the #else variant reverses 4 lanes around the call. */ 17210 #ifdef __LITTLE_ENDIAN__ 17211 __ai __attribute__((target("neon"))) float32x4_t vminq_f32(float32x4_t __p0, float32x4_t __p1) { 17212 float32x4_t __ret; 17213 __ret = (float32x4_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 17214 return __ret; 17215 } 17216 #else 17217 __ai __attribute__((target("neon"))) 
float32x4_t vminq_f32(float32x4_t __p0, float32x4_t __p1) { 17218 float32x4_t __ret; 17219 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17220 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17221 __ret = (float32x4_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 17222 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17223 return __ret; 17224 } 17225 #endif 17226 /* vminq_s32: __builtin_neon_vminq_v on int32x4_t operands with trailing constant 34; the #else variant reverses 4 lanes around the call. */ 17227 #ifdef __LITTLE_ENDIAN__ 17228 __ai __attribute__((target("neon"))) int32x4_t vminq_s32(int32x4_t __p0, int32x4_t __p1) { 17229 int32x4_t __ret; 17230 __ret = (int32x4_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 17231 return __ret; 17232 } 17233 #else 17234 __ai __attribute__((target("neon"))) int32x4_t vminq_s32(int32x4_t __p0, int32x4_t __p1) { 17235 int32x4_t __ret; 17236 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17237 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17238 __ret = (int32x4_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 17239 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17240 return __ret; 17241 } 17242 #endif 17243 /* vminq_s16: __builtin_neon_vminq_v on int16x8_t operands with trailing constant 33; the #else variant reverses 8 lanes around the call. */ 17244 #ifdef __LITTLE_ENDIAN__ 17245 __ai __attribute__((target("neon"))) int16x8_t vminq_s16(int16x8_t __p0, int16x8_t __p1) { 17246 int16x8_t __ret; 17247 __ret = (int16x8_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 17248 return __ret; 17249 } 17250 #else 17251 __ai __attribute__((target("neon"))) int16x8_t vminq_s16(int16x8_t __p0, int16x8_t __p1) { 17252 int16x8_t __ret; 17253 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17254 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17255 __ret = (int16x8_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 17256 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17257 return 
__ret; 17258 } 17259 #endif 17260 /* vmin_u8: casts both uint8x8_t operands to int8x8_t, calls __builtin_neon_vmin_v with trailing constant 16 and casts the result back; the #else variant reverses the 8 lanes of each operand before the call and of the result after it. */ 17261 #ifdef __LITTLE_ENDIAN__ 17262 __ai __attribute__((target("neon"))) uint8x8_t vmin_u8(uint8x8_t __p0, uint8x8_t __p1) { 17263 uint8x8_t __ret; 17264 __ret = (uint8x8_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 17265 return __ret; 17266 } 17267 #else 17268 __ai __attribute__((target("neon"))) uint8x8_t vmin_u8(uint8x8_t __p0, uint8x8_t __p1) { 17269 uint8x8_t __ret; 17270 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17271 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17272 __ret = (uint8x8_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 17273 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17274 return __ret; 17275 } 17276 #endif 17277 /* vmin_u32: __builtin_neon_vmin_v on uint32x2_t operands with trailing constant 18; the #else variant swaps 2 lanes around the call. */ 17278 #ifdef __LITTLE_ENDIAN__ 17279 __ai __attribute__((target("neon"))) uint32x2_t vmin_u32(uint32x2_t __p0, uint32x2_t __p1) { 17280 uint32x2_t __ret; 17281 __ret = (uint32x2_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 17282 return __ret; 17283 } 17284 #else 17285 __ai __attribute__((target("neon"))) uint32x2_t vmin_u32(uint32x2_t __p0, uint32x2_t __p1) { 17286 uint32x2_t __ret; 17287 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17288 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17289 __ret = (uint32x2_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 17290 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17291 return __ret; 17292 } 17293 #endif 17294 /* vmin_u16: __builtin_neon_vmin_v on uint16x4_t operands with trailing constant 17; the #else variant reverses 4 lanes around the call. */ 17295 #ifdef __LITTLE_ENDIAN__ 17296 __ai __attribute__((target("neon"))) uint16x4_t vmin_u16(uint16x4_t __p0, uint16x4_t __p1) { 17297 uint16x4_t __ret; 17298 __ret = (uint16x4_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 17299 return __ret; 17300 } 17301 #else 17302 __ai __attribute__((target("neon"))) uint16x4_t vmin_u16(uint16x4_t __p0, uint16x4_t __p1) { 17303 uint16x4_t __ret; 17304 uint16x4_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17305 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17306 __ret = (uint16x4_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 17307 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17308 return __ret; 17309 } 17310 #endif 17311 /* vmin_s8: __builtin_neon_vmin_v on int8x8_t operands with trailing constant 0; the #else variant reverses 8 lanes around the call. */ 17312 #ifdef __LITTLE_ENDIAN__ 17313 __ai __attribute__((target("neon"))) int8x8_t vmin_s8(int8x8_t __p0, int8x8_t __p1) { 17314 int8x8_t __ret; 17315 __ret = (int8x8_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 17316 return __ret; 17317 } 17318 #else 17319 __ai __attribute__((target("neon"))) int8x8_t vmin_s8(int8x8_t __p0, int8x8_t __p1) { 17320 int8x8_t __ret; 17321 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17322 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17323 __ret = (int8x8_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 17324 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17325 return __ret; 17326 } 17327 #endif 17328 /* vmin_f32: __builtin_neon_vmin_v on float32x2_t operands with trailing constant 9; the #else variant swaps 2 lanes around the call. */ 17329 #ifdef __LITTLE_ENDIAN__ 17330 __ai __attribute__((target("neon"))) float32x2_t vmin_f32(float32x2_t __p0, float32x2_t __p1) { 17331 float32x2_t __ret; 17332 __ret = (float32x2_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 17333 return __ret; 17334 } 17335 #else 17336 __ai __attribute__((target("neon"))) float32x2_t vmin_f32(float32x2_t __p0, float32x2_t __p1) { 17337 float32x2_t __ret; 17338 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17339 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17340 __ret = (float32x2_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 17341 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17342 return __ret; 17343 } 17344 #endif 17345 /* vmin_s32: __builtin_neon_vmin_v on int32x2_t operands with trailing constant 2; the #else variant swaps 2 lanes around the call. */ 17346 #ifdef __LITTLE_ENDIAN__ 17347 __ai __attribute__((target("neon"))) int32x2_t vmin_s32(int32x2_t 
__p0, int32x2_t __p1) { 17348 int32x2_t __ret; 17349 __ret = (int32x2_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 17350 return __ret; 17351 } 17352 #else 17353 __ai __attribute__((target("neon"))) int32x2_t vmin_s32(int32x2_t __p0, int32x2_t __p1) { 17354 int32x2_t __ret; 17355 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17356 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17357 __ret = (int32x2_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 17358 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17359 return __ret; 17360 } 17361 #endif 17362 /* vmin_s16: __builtin_neon_vmin_v on int16x4_t operands with trailing constant 1; the #else variant reverses 4 lanes around the call. */ 17363 #ifdef __LITTLE_ENDIAN__ 17364 __ai __attribute__((target("neon"))) int16x4_t vmin_s16(int16x4_t __p0, int16x4_t __p1) { 17365 int16x4_t __ret; 17366 __ret = (int16x4_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 17367 return __ret; 17368 } 17369 #else 17370 __ai __attribute__((target("neon"))) int16x4_t vmin_s16(int16x4_t __p0, int16x4_t __p1) { 17371 int16x4_t __ret; 17372 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17373 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17374 __ret = (int16x4_t) __builtin_neon_vmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 17375 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17376 return __ret; 17377 } 17378 #endif 17379 /* vmlaq_u8: the __LITTLE_ENDIAN__ variant computes __p0 + __p1 * __p2 with the vector operators directly, without a builtin call. */ 17380 #ifdef __LITTLE_ENDIAN__ 17381 __ai __attribute__((target("neon"))) uint8x16_t vmlaq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 17382 uint8x16_t __ret; 17383 __ret = __p0 + __p1 * __p2; 17384 return __ret; 17385 } 17386 #else 17387 __ai __attribute__((target("neon"))) uint8x16_t vmlaq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 17388 uint8x16_t __ret; 17389 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17390 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 
8, 7, 6, 5, 4, 3, 2, 1, 0); 17391 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17392 __ret = __rev0 + __rev1 * __rev2; 17393 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17394 return __ret; 17395 } 17396 #endif 17397 17398 #ifdef __LITTLE_ENDIAN__ 17399 __ai __attribute__((target("neon"))) uint32x4_t vmlaq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 17400 uint32x4_t __ret; 17401 __ret = __p0 + __p1 * __p2; 17402 return __ret; 17403 } 17404 #else 17405 __ai __attribute__((target("neon"))) uint32x4_t vmlaq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 17406 uint32x4_t __ret; 17407 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17408 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17409 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 17410 __ret = __rev0 + __rev1 * __rev2; 17411 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17412 return __ret; 17413 } 17414 #endif 17415 17416 #ifdef __LITTLE_ENDIAN__ 17417 __ai __attribute__((target("neon"))) uint16x8_t vmlaq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 17418 uint16x8_t __ret; 17419 __ret = __p0 + __p1 * __p2; 17420 return __ret; 17421 } 17422 #else 17423 __ai __attribute__((target("neon"))) uint16x8_t vmlaq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 17424 uint16x8_t __ret; 17425 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17426 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17427 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 17428 __ret = __rev0 + __rev1 * __rev2; 17429 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17430 return __ret; 17431 } 17432 #endif 17433 17434 #ifdef 
__LITTLE_ENDIAN__ 17435 __ai __attribute__((target("neon"))) int8x16_t vmlaq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 17436 int8x16_t __ret; 17437 __ret = __p0 + __p1 * __p2; 17438 return __ret; 17439 } 17440 #else 17441 __ai __attribute__((target("neon"))) int8x16_t vmlaq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 17442 int8x16_t __ret; 17443 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17444 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17445 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17446 __ret = __rev0 + __rev1 * __rev2; 17447 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 17448 return __ret; 17449 } 17450 #endif 17451 17452 #ifdef __LITTLE_ENDIAN__ 17453 __ai __attribute__((target("neon"))) float32x4_t vmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 17454 float32x4_t __ret; 17455 __ret = __p0 + __p1 * __p2; 17456 return __ret; 17457 } 17458 #else 17459 __ai __attribute__((target("neon"))) float32x4_t vmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 17460 float32x4_t __ret; 17461 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17462 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17463 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 17464 __ret = __rev0 + __rev1 * __rev2; 17465 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17466 return __ret; 17467 } 17468 #endif 17469 17470 #ifdef __LITTLE_ENDIAN__ 17471 __ai __attribute__((target("neon"))) int32x4_t vmlaq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 17472 int32x4_t __ret; 17473 __ret = __p0 + __p1 * __p2; 17474 return __ret; 17475 } 17476 #else 17477 __ai 
__attribute__((target("neon"))) int32x4_t vmlaq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 17478 int32x4_t __ret; 17479 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17480 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17481 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 17482 __ret = __rev0 + __rev1 * __rev2; 17483 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17484 return __ret; 17485 } 17486 #endif 17487 17488 #ifdef __LITTLE_ENDIAN__ 17489 __ai __attribute__((target("neon"))) int16x8_t vmlaq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 17490 int16x8_t __ret; 17491 __ret = __p0 + __p1 * __p2; 17492 return __ret; 17493 } 17494 #else 17495 __ai __attribute__((target("neon"))) int16x8_t vmlaq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 17496 int16x8_t __ret; 17497 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17498 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17499 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 17500 __ret = __rev0 + __rev1 * __rev2; 17501 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17502 return __ret; 17503 } 17504 #endif 17505 17506 #ifdef __LITTLE_ENDIAN__ 17507 __ai __attribute__((target("neon"))) uint8x8_t vmla_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 17508 uint8x8_t __ret; 17509 __ret = __p0 + __p1 * __p2; 17510 return __ret; 17511 } 17512 #else 17513 __ai __attribute__((target("neon"))) uint8x8_t vmla_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 17514 uint8x8_t __ret; 17515 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17516 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17517 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 
0); 17518 __ret = __rev0 + __rev1 * __rev2; 17519 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17520 return __ret; 17521 } 17522 #endif 17523 17524 #ifdef __LITTLE_ENDIAN__ 17525 __ai __attribute__((target("neon"))) uint32x2_t vmla_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 17526 uint32x2_t __ret; 17527 __ret = __p0 + __p1 * __p2; 17528 return __ret; 17529 } 17530 #else 17531 __ai __attribute__((target("neon"))) uint32x2_t vmla_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 17532 uint32x2_t __ret; 17533 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17534 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17535 uint32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 17536 __ret = __rev0 + __rev1 * __rev2; 17537 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17538 return __ret; 17539 } 17540 #endif 17541 17542 #ifdef __LITTLE_ENDIAN__ 17543 __ai __attribute__((target("neon"))) uint16x4_t vmla_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 17544 uint16x4_t __ret; 17545 __ret = __p0 + __p1 * __p2; 17546 return __ret; 17547 } 17548 #else 17549 __ai __attribute__((target("neon"))) uint16x4_t vmla_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 17550 uint16x4_t __ret; 17551 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17552 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17553 uint16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 17554 __ret = __rev0 + __rev1 * __rev2; 17555 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17556 return __ret; 17557 } 17558 #endif 17559 17560 #ifdef __LITTLE_ENDIAN__ 17561 __ai __attribute__((target("neon"))) int8x8_t vmla_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 17562 int8x8_t __ret; 17563 __ret = __p0 + __p1 * __p2; 17564 return __ret; 17565 } 17566 #else 17567 __ai __attribute__((target("neon"))) 
int8x8_t vmla_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 17568 int8x8_t __ret; 17569 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17570 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17571 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 17572 __ret = __rev0 + __rev1 * __rev2; 17573 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17574 return __ret; 17575 } 17576 #endif 17577 17578 #ifdef __LITTLE_ENDIAN__ 17579 __ai __attribute__((target("neon"))) float32x2_t vmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 17580 float32x2_t __ret; 17581 __ret = __p0 + __p1 * __p2; 17582 return __ret; 17583 } 17584 #else 17585 __ai __attribute__((target("neon"))) float32x2_t vmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 17586 float32x2_t __ret; 17587 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17588 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17589 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 17590 __ret = __rev0 + __rev1 * __rev2; 17591 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17592 return __ret; 17593 } 17594 #endif 17595 17596 #ifdef __LITTLE_ENDIAN__ 17597 __ai __attribute__((target("neon"))) int32x2_t vmla_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 17598 int32x2_t __ret; 17599 __ret = __p0 + __p1 * __p2; 17600 return __ret; 17601 } 17602 #else 17603 __ai __attribute__((target("neon"))) int32x2_t vmla_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 17604 int32x2_t __ret; 17605 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17606 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17607 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 17608 __ret = __rev0 + __rev1 * __rev2; 17609 __ret = __builtin_shufflevector(__ret, __ret, 
1, 0); 17610 return __ret; 17611 } 17612 #endif 17613 17614 #ifdef __LITTLE_ENDIAN__ 17615 __ai __attribute__((target("neon"))) int16x4_t vmla_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 17616 int16x4_t __ret; 17617 __ret = __p0 + __p1 * __p2; 17618 return __ret; 17619 } 17620 #else 17621 __ai __attribute__((target("neon"))) int16x4_t vmla_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 17622 int16x4_t __ret; 17623 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17624 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17625 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 17626 __ret = __rev0 + __rev1 * __rev2; 17627 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17628 return __ret; 17629 } 17630 #endif 17631 17632 #ifdef __LITTLE_ENDIAN__ 17633 #define vmlaq_lane_u32(__p0_54, __p1_54, __p2_54, __p3_54) __extension__ ({ \ 17634 uint32x4_t __ret_54; \ 17635 uint32x4_t __s0_54 = __p0_54; \ 17636 uint32x4_t __s1_54 = __p1_54; \ 17637 uint32x2_t __s2_54 = __p2_54; \ 17638 __ret_54 = __s0_54 + __s1_54 * splatq_lane_u32(__s2_54, __p3_54); \ 17639 __ret_54; \ 17640 }) 17641 #else 17642 #define vmlaq_lane_u32(__p0_55, __p1_55, __p2_55, __p3_55) __extension__ ({ \ 17643 uint32x4_t __ret_55; \ 17644 uint32x4_t __s0_55 = __p0_55; \ 17645 uint32x4_t __s1_55 = __p1_55; \ 17646 uint32x2_t __s2_55 = __p2_55; \ 17647 uint32x4_t __rev0_55; __rev0_55 = __builtin_shufflevector(__s0_55, __s0_55, 3, 2, 1, 0); \ 17648 uint32x4_t __rev1_55; __rev1_55 = __builtin_shufflevector(__s1_55, __s1_55, 3, 2, 1, 0); \ 17649 uint32x2_t __rev2_55; __rev2_55 = __builtin_shufflevector(__s2_55, __s2_55, 1, 0); \ 17650 __ret_55 = __rev0_55 + __rev1_55 * __noswap_splatq_lane_u32(__rev2_55, __p3_55); \ 17651 __ret_55 = __builtin_shufflevector(__ret_55, __ret_55, 3, 2, 1, 0); \ 17652 __ret_55; \ 17653 }) 17654 #endif 17655 17656 #ifdef __LITTLE_ENDIAN__ 17657 #define vmlaq_lane_u16(__p0_56, __p1_56, 
__p2_56, __p3_56) __extension__ ({ \ 17658 uint16x8_t __ret_56; \ 17659 uint16x8_t __s0_56 = __p0_56; \ 17660 uint16x8_t __s1_56 = __p1_56; \ 17661 uint16x4_t __s2_56 = __p2_56; \ 17662 __ret_56 = __s0_56 + __s1_56 * splatq_lane_u16(__s2_56, __p3_56); \ 17663 __ret_56; \ 17664 }) 17665 #else 17666 #define vmlaq_lane_u16(__p0_57, __p1_57, __p2_57, __p3_57) __extension__ ({ \ 17667 uint16x8_t __ret_57; \ 17668 uint16x8_t __s0_57 = __p0_57; \ 17669 uint16x8_t __s1_57 = __p1_57; \ 17670 uint16x4_t __s2_57 = __p2_57; \ 17671 uint16x8_t __rev0_57; __rev0_57 = __builtin_shufflevector(__s0_57, __s0_57, 7, 6, 5, 4, 3, 2, 1, 0); \ 17672 uint16x8_t __rev1_57; __rev1_57 = __builtin_shufflevector(__s1_57, __s1_57, 7, 6, 5, 4, 3, 2, 1, 0); \ 17673 uint16x4_t __rev2_57; __rev2_57 = __builtin_shufflevector(__s2_57, __s2_57, 3, 2, 1, 0); \ 17674 __ret_57 = __rev0_57 + __rev1_57 * __noswap_splatq_lane_u16(__rev2_57, __p3_57); \ 17675 __ret_57 = __builtin_shufflevector(__ret_57, __ret_57, 7, 6, 5, 4, 3, 2, 1, 0); \ 17676 __ret_57; \ 17677 }) 17678 #endif 17679 17680 #ifdef __LITTLE_ENDIAN__ 17681 #define vmlaq_lane_f32(__p0_58, __p1_58, __p2_58, __p3_58) __extension__ ({ \ 17682 float32x4_t __ret_58; \ 17683 float32x4_t __s0_58 = __p0_58; \ 17684 float32x4_t __s1_58 = __p1_58; \ 17685 float32x2_t __s2_58 = __p2_58; \ 17686 __ret_58 = __s0_58 + __s1_58 * splatq_lane_f32(__s2_58, __p3_58); \ 17687 __ret_58; \ 17688 }) 17689 #else 17690 #define vmlaq_lane_f32(__p0_59, __p1_59, __p2_59, __p3_59) __extension__ ({ \ 17691 float32x4_t __ret_59; \ 17692 float32x4_t __s0_59 = __p0_59; \ 17693 float32x4_t __s1_59 = __p1_59; \ 17694 float32x2_t __s2_59 = __p2_59; \ 17695 float32x4_t __rev0_59; __rev0_59 = __builtin_shufflevector(__s0_59, __s0_59, 3, 2, 1, 0); \ 17696 float32x4_t __rev1_59; __rev1_59 = __builtin_shufflevector(__s1_59, __s1_59, 3, 2, 1, 0); \ 17697 float32x2_t __rev2_59; __rev2_59 = __builtin_shufflevector(__s2_59, __s2_59, 1, 0); \ 17698 __ret_59 = __rev0_59 + __rev1_59 * 
__noswap_splatq_lane_f32(__rev2_59, __p3_59); \ 17699 __ret_59 = __builtin_shufflevector(__ret_59, __ret_59, 3, 2, 1, 0); \ 17700 __ret_59; \ 17701 }) 17702 #endif 17703 17704 #ifdef __LITTLE_ENDIAN__ 17705 #define vmlaq_lane_s32(__p0_60, __p1_60, __p2_60, __p3_60) __extension__ ({ \ 17706 int32x4_t __ret_60; \ 17707 int32x4_t __s0_60 = __p0_60; \ 17708 int32x4_t __s1_60 = __p1_60; \ 17709 int32x2_t __s2_60 = __p2_60; \ 17710 __ret_60 = __s0_60 + __s1_60 * splatq_lane_s32(__s2_60, __p3_60); \ 17711 __ret_60; \ 17712 }) 17713 #else 17714 #define vmlaq_lane_s32(__p0_61, __p1_61, __p2_61, __p3_61) __extension__ ({ \ 17715 int32x4_t __ret_61; \ 17716 int32x4_t __s0_61 = __p0_61; \ 17717 int32x4_t __s1_61 = __p1_61; \ 17718 int32x2_t __s2_61 = __p2_61; \ 17719 int32x4_t __rev0_61; __rev0_61 = __builtin_shufflevector(__s0_61, __s0_61, 3, 2, 1, 0); \ 17720 int32x4_t __rev1_61; __rev1_61 = __builtin_shufflevector(__s1_61, __s1_61, 3, 2, 1, 0); \ 17721 int32x2_t __rev2_61; __rev2_61 = __builtin_shufflevector(__s2_61, __s2_61, 1, 0); \ 17722 __ret_61 = __rev0_61 + __rev1_61 * __noswap_splatq_lane_s32(__rev2_61, __p3_61); \ 17723 __ret_61 = __builtin_shufflevector(__ret_61, __ret_61, 3, 2, 1, 0); \ 17724 __ret_61; \ 17725 }) 17726 #endif 17727 17728 #ifdef __LITTLE_ENDIAN__ 17729 #define vmlaq_lane_s16(__p0_62, __p1_62, __p2_62, __p3_62) __extension__ ({ \ 17730 int16x8_t __ret_62; \ 17731 int16x8_t __s0_62 = __p0_62; \ 17732 int16x8_t __s1_62 = __p1_62; \ 17733 int16x4_t __s2_62 = __p2_62; \ 17734 __ret_62 = __s0_62 + __s1_62 * splatq_lane_s16(__s2_62, __p3_62); \ 17735 __ret_62; \ 17736 }) 17737 #else 17738 #define vmlaq_lane_s16(__p0_63, __p1_63, __p2_63, __p3_63) __extension__ ({ \ 17739 int16x8_t __ret_63; \ 17740 int16x8_t __s0_63 = __p0_63; \ 17741 int16x8_t __s1_63 = __p1_63; \ 17742 int16x4_t __s2_63 = __p2_63; \ 17743 int16x8_t __rev0_63; __rev0_63 = __builtin_shufflevector(__s0_63, __s0_63, 7, 6, 5, 4, 3, 2, 1, 0); \ 17744 int16x8_t __rev1_63; __rev1_63 = 
__builtin_shufflevector(__s1_63, __s1_63, 7, 6, 5, 4, 3, 2, 1, 0); \ 17745 int16x4_t __rev2_63; __rev2_63 = __builtin_shufflevector(__s2_63, __s2_63, 3, 2, 1, 0); \ 17746 __ret_63 = __rev0_63 + __rev1_63 * __noswap_splatq_lane_s16(__rev2_63, __p3_63); \ 17747 __ret_63 = __builtin_shufflevector(__ret_63, __ret_63, 7, 6, 5, 4, 3, 2, 1, 0); \ 17748 __ret_63; \ 17749 }) 17750 #endif 17751 17752 #ifdef __LITTLE_ENDIAN__ 17753 #define vmla_lane_u32(__p0_64, __p1_64, __p2_64, __p3_64) __extension__ ({ \ 17754 uint32x2_t __ret_64; \ 17755 uint32x2_t __s0_64 = __p0_64; \ 17756 uint32x2_t __s1_64 = __p1_64; \ 17757 uint32x2_t __s2_64 = __p2_64; \ 17758 __ret_64 = __s0_64 + __s1_64 * splat_lane_u32(__s2_64, __p3_64); \ 17759 __ret_64; \ 17760 }) 17761 #else 17762 #define vmla_lane_u32(__p0_65, __p1_65, __p2_65, __p3_65) __extension__ ({ \ 17763 uint32x2_t __ret_65; \ 17764 uint32x2_t __s0_65 = __p0_65; \ 17765 uint32x2_t __s1_65 = __p1_65; \ 17766 uint32x2_t __s2_65 = __p2_65; \ 17767 uint32x2_t __rev0_65; __rev0_65 = __builtin_shufflevector(__s0_65, __s0_65, 1, 0); \ 17768 uint32x2_t __rev1_65; __rev1_65 = __builtin_shufflevector(__s1_65, __s1_65, 1, 0); \ 17769 uint32x2_t __rev2_65; __rev2_65 = __builtin_shufflevector(__s2_65, __s2_65, 1, 0); \ 17770 __ret_65 = __rev0_65 + __rev1_65 * __noswap_splat_lane_u32(__rev2_65, __p3_65); \ 17771 __ret_65 = __builtin_shufflevector(__ret_65, __ret_65, 1, 0); \ 17772 __ret_65; \ 17773 }) 17774 #endif 17775 17776 #ifdef __LITTLE_ENDIAN__ 17777 #define vmla_lane_u16(__p0_66, __p1_66, __p2_66, __p3_66) __extension__ ({ \ 17778 uint16x4_t __ret_66; \ 17779 uint16x4_t __s0_66 = __p0_66; \ 17780 uint16x4_t __s1_66 = __p1_66; \ 17781 uint16x4_t __s2_66 = __p2_66; \ 17782 __ret_66 = __s0_66 + __s1_66 * splat_lane_u16(__s2_66, __p3_66); \ 17783 __ret_66; \ 17784 }) 17785 #else 17786 #define vmla_lane_u16(__p0_67, __p1_67, __p2_67, __p3_67) __extension__ ({ \ 17787 uint16x4_t __ret_67; \ 17788 uint16x4_t __s0_67 = __p0_67; \ 17789 uint16x4_t 
__s1_67 = __p1_67; \ 17790 uint16x4_t __s2_67 = __p2_67; \ 17791 uint16x4_t __rev0_67; __rev0_67 = __builtin_shufflevector(__s0_67, __s0_67, 3, 2, 1, 0); \ 17792 uint16x4_t __rev1_67; __rev1_67 = __builtin_shufflevector(__s1_67, __s1_67, 3, 2, 1, 0); \ 17793 uint16x4_t __rev2_67; __rev2_67 = __builtin_shufflevector(__s2_67, __s2_67, 3, 2, 1, 0); \ 17794 __ret_67 = __rev0_67 + __rev1_67 * __noswap_splat_lane_u16(__rev2_67, __p3_67); \ 17795 __ret_67 = __builtin_shufflevector(__ret_67, __ret_67, 3, 2, 1, 0); \ 17796 __ret_67; \ 17797 }) 17798 #endif 17799 17800 #ifdef __LITTLE_ENDIAN__ 17801 #define vmla_lane_f32(__p0_68, __p1_68, __p2_68, __p3_68) __extension__ ({ \ 17802 float32x2_t __ret_68; \ 17803 float32x2_t __s0_68 = __p0_68; \ 17804 float32x2_t __s1_68 = __p1_68; \ 17805 float32x2_t __s2_68 = __p2_68; \ 17806 __ret_68 = __s0_68 + __s1_68 * splat_lane_f32(__s2_68, __p3_68); \ 17807 __ret_68; \ 17808 }) 17809 #else 17810 #define vmla_lane_f32(__p0_69, __p1_69, __p2_69, __p3_69) __extension__ ({ \ 17811 float32x2_t __ret_69; \ 17812 float32x2_t __s0_69 = __p0_69; \ 17813 float32x2_t __s1_69 = __p1_69; \ 17814 float32x2_t __s2_69 = __p2_69; \ 17815 float32x2_t __rev0_69; __rev0_69 = __builtin_shufflevector(__s0_69, __s0_69, 1, 0); \ 17816 float32x2_t __rev1_69; __rev1_69 = __builtin_shufflevector(__s1_69, __s1_69, 1, 0); \ 17817 float32x2_t __rev2_69; __rev2_69 = __builtin_shufflevector(__s2_69, __s2_69, 1, 0); \ 17818 __ret_69 = __rev0_69 + __rev1_69 * __noswap_splat_lane_f32(__rev2_69, __p3_69); \ 17819 __ret_69 = __builtin_shufflevector(__ret_69, __ret_69, 1, 0); \ 17820 __ret_69; \ 17821 }) 17822 #endif 17823 17824 #ifdef __LITTLE_ENDIAN__ 17825 #define vmla_lane_s32(__p0_70, __p1_70, __p2_70, __p3_70) __extension__ ({ \ 17826 int32x2_t __ret_70; \ 17827 int32x2_t __s0_70 = __p0_70; \ 17828 int32x2_t __s1_70 = __p1_70; \ 17829 int32x2_t __s2_70 = __p2_70; \ 17830 __ret_70 = __s0_70 + __s1_70 * splat_lane_s32(__s2_70, __p3_70); \ 17831 __ret_70; \ 17832 }) 
17833 #else 17834 #define vmla_lane_s32(__p0_71, __p1_71, __p2_71, __p3_71) __extension__ ({ \ 17835 int32x2_t __ret_71; \ 17836 int32x2_t __s0_71 = __p0_71; \ 17837 int32x2_t __s1_71 = __p1_71; \ 17838 int32x2_t __s2_71 = __p2_71; \ 17839 int32x2_t __rev0_71; __rev0_71 = __builtin_shufflevector(__s0_71, __s0_71, 1, 0); \ 17840 int32x2_t __rev1_71; __rev1_71 = __builtin_shufflevector(__s1_71, __s1_71, 1, 0); \ 17841 int32x2_t __rev2_71; __rev2_71 = __builtin_shufflevector(__s2_71, __s2_71, 1, 0); \ 17842 __ret_71 = __rev0_71 + __rev1_71 * __noswap_splat_lane_s32(__rev2_71, __p3_71); \ 17843 __ret_71 = __builtin_shufflevector(__ret_71, __ret_71, 1, 0); \ 17844 __ret_71; \ 17845 }) 17846 #endif 17847 17848 #ifdef __LITTLE_ENDIAN__ 17849 #define vmla_lane_s16(__p0_72, __p1_72, __p2_72, __p3_72) __extension__ ({ \ 17850 int16x4_t __ret_72; \ 17851 int16x4_t __s0_72 = __p0_72; \ 17852 int16x4_t __s1_72 = __p1_72; \ 17853 int16x4_t __s2_72 = __p2_72; \ 17854 __ret_72 = __s0_72 + __s1_72 * splat_lane_s16(__s2_72, __p3_72); \ 17855 __ret_72; \ 17856 }) 17857 #else 17858 #define vmla_lane_s16(__p0_73, __p1_73, __p2_73, __p3_73) __extension__ ({ \ 17859 int16x4_t __ret_73; \ 17860 int16x4_t __s0_73 = __p0_73; \ 17861 int16x4_t __s1_73 = __p1_73; \ 17862 int16x4_t __s2_73 = __p2_73; \ 17863 int16x4_t __rev0_73; __rev0_73 = __builtin_shufflevector(__s0_73, __s0_73, 3, 2, 1, 0); \ 17864 int16x4_t __rev1_73; __rev1_73 = __builtin_shufflevector(__s1_73, __s1_73, 3, 2, 1, 0); \ 17865 int16x4_t __rev2_73; __rev2_73 = __builtin_shufflevector(__s2_73, __s2_73, 3, 2, 1, 0); \ 17866 __ret_73 = __rev0_73 + __rev1_73 * __noswap_splat_lane_s16(__rev2_73, __p3_73); \ 17867 __ret_73 = __builtin_shufflevector(__ret_73, __ret_73, 3, 2, 1, 0); \ 17868 __ret_73; \ 17869 }) 17870 #endif 17871 17872 #ifdef __LITTLE_ENDIAN__ 17873 __ai __attribute__((target("neon"))) uint32x4_t vmlaq_n_u32(uint32x4_t __p0, uint32x4_t __p1, uint32_t __p2) { 17874 uint32x4_t __ret; 17875 __ret = __p0 + __p1 * 
(uint32x4_t) {__p2, __p2, __p2, __p2}; 17876 return __ret; 17877 } 17878 #else 17879 __ai __attribute__((target("neon"))) uint32x4_t vmlaq_n_u32(uint32x4_t __p0, uint32x4_t __p1, uint32_t __p2) { 17880 uint32x4_t __ret; 17881 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17882 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17883 __ret = __rev0 + __rev1 * (uint32x4_t) {__p2, __p2, __p2, __p2}; 17884 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17885 return __ret; 17886 } 17887 #endif 17888 17889 #ifdef __LITTLE_ENDIAN__ 17890 __ai __attribute__((target("neon"))) uint16x8_t vmlaq_n_u16(uint16x8_t __p0, uint16x8_t __p1, uint16_t __p2) { 17891 uint16x8_t __ret; 17892 __ret = __p0 + __p1 * (uint16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2}; 17893 return __ret; 17894 } 17895 #else 17896 __ai __attribute__((target("neon"))) uint16x8_t vmlaq_n_u16(uint16x8_t __p0, uint16x8_t __p1, uint16_t __p2) { 17897 uint16x8_t __ret; 17898 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17899 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17900 __ret = __rev0 + __rev1 * (uint16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2}; 17901 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17902 return __ret; 17903 } 17904 #endif 17905 17906 #ifdef __LITTLE_ENDIAN__ 17907 __ai __attribute__((target("neon"))) float32x4_t vmlaq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) { 17908 float32x4_t __ret; 17909 __ret = __p0 + __p1 * (float32x4_t) {__p2, __p2, __p2, __p2}; 17910 return __ret; 17911 } 17912 #else 17913 __ai __attribute__((target("neon"))) float32x4_t vmlaq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) { 17914 float32x4_t __ret; 17915 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17916 float32x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17917 __ret = __rev0 + __rev1 * (float32x4_t) {__p2, __p2, __p2, __p2}; 17918 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17919 return __ret; 17920 } 17921 #endif 17922 17923 #ifdef __LITTLE_ENDIAN__ 17924 __ai __attribute__((target("neon"))) int32x4_t vmlaq_n_s32(int32x4_t __p0, int32x4_t __p1, int32_t __p2) { 17925 int32x4_t __ret; 17926 __ret = __p0 + __p1 * (int32x4_t) {__p2, __p2, __p2, __p2}; 17927 return __ret; 17928 } 17929 #else 17930 __ai __attribute__((target("neon"))) int32x4_t vmlaq_n_s32(int32x4_t __p0, int32x4_t __p1, int32_t __p2) { 17931 int32x4_t __ret; 17932 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17933 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17934 __ret = __rev0 + __rev1 * (int32x4_t) {__p2, __p2, __p2, __p2}; 17935 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17936 return __ret; 17937 } 17938 #endif 17939 17940 #ifdef __LITTLE_ENDIAN__ 17941 __ai __attribute__((target("neon"))) int16x8_t vmlaq_n_s16(int16x8_t __p0, int16x8_t __p1, int16_t __p2) { 17942 int16x8_t __ret; 17943 __ret = __p0 + __p1 * (int16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2}; 17944 return __ret; 17945 } 17946 #else 17947 __ai __attribute__((target("neon"))) int16x8_t vmlaq_n_s16(int16x8_t __p0, int16x8_t __p1, int16_t __p2) { 17948 int16x8_t __ret; 17949 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 17950 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 17951 __ret = __rev0 + __rev1 * (int16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2}; 17952 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 17953 return __ret; 17954 } 17955 #endif 17956 17957 #ifdef __LITTLE_ENDIAN__ 17958 __ai __attribute__((target("neon"))) uint32x2_t vmla_n_u32(uint32x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 17959 uint32x2_t __ret; 
17960 __ret = __p0 + __p1 * (uint32x2_t) {__p2, __p2}; 17961 return __ret; 17962 } 17963 #else 17964 __ai __attribute__((target("neon"))) uint32x2_t vmla_n_u32(uint32x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 17965 uint32x2_t __ret; 17966 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 17967 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 17968 __ret = __rev0 + __rev1 * (uint32x2_t) {__p2, __p2}; 17969 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 17970 return __ret; 17971 } 17972 #endif 17973 17974 #ifdef __LITTLE_ENDIAN__ 17975 __ai __attribute__((target("neon"))) uint16x4_t vmla_n_u16(uint16x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 17976 uint16x4_t __ret; 17977 __ret = __p0 + __p1 * (uint16x4_t) {__p2, __p2, __p2, __p2}; 17978 return __ret; 17979 } 17980 #else 17981 __ai __attribute__((target("neon"))) uint16x4_t vmla_n_u16(uint16x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 17982 uint16x4_t __ret; 17983 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 17984 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 17985 __ret = __rev0 + __rev1 * (uint16x4_t) {__p2, __p2, __p2, __p2}; 17986 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 17987 return __ret; 17988 } 17989 #endif 17990 17991 #ifdef __LITTLE_ENDIAN__ 17992 __ai __attribute__((target("neon"))) float32x2_t vmla_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) { 17993 float32x2_t __ret; 17994 __ret = __p0 + __p1 * (float32x2_t) {__p2, __p2}; 17995 return __ret; 17996 } 17997 #else 17998 __ai __attribute__((target("neon"))) float32x2_t vmla_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) { 17999 float32x2_t __ret; 18000 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 18001 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 18002 __ret = __rev0 + __rev1 * (float32x2_t) {__p2, __p2}; 18003 __ret = __builtin_shufflevector(__ret, 
__ret, 1, 0); 18004 return __ret; 18005 } 18006 #endif 18007 18008 #ifdef __LITTLE_ENDIAN__ 18009 __ai __attribute__((target("neon"))) int32x2_t vmla_n_s32(int32x2_t __p0, int32x2_t __p1, int32_t __p2) { 18010 int32x2_t __ret; 18011 __ret = __p0 + __p1 * (int32x2_t) {__p2, __p2}; 18012 return __ret; 18013 } 18014 #else 18015 __ai __attribute__((target("neon"))) int32x2_t vmla_n_s32(int32x2_t __p0, int32x2_t __p1, int32_t __p2) { 18016 int32x2_t __ret; 18017 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 18018 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 18019 __ret = __rev0 + __rev1 * (int32x2_t) {__p2, __p2}; 18020 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18021 return __ret; 18022 } 18023 #endif 18024 18025 #ifdef __LITTLE_ENDIAN__ 18026 __ai __attribute__((target("neon"))) int16x4_t vmla_n_s16(int16x4_t __p0, int16x4_t __p1, int16_t __p2) { 18027 int16x4_t __ret; 18028 __ret = __p0 + __p1 * (int16x4_t) {__p2, __p2, __p2, __p2}; 18029 return __ret; 18030 } 18031 #else 18032 __ai __attribute__((target("neon"))) int16x4_t vmla_n_s16(int16x4_t __p0, int16x4_t __p1, int16_t __p2) { 18033 int16x4_t __ret; 18034 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18035 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18036 __ret = __rev0 + __rev1 * (int16x4_t) {__p2, __p2, __p2, __p2}; 18037 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18038 return __ret; 18039 } 18040 #endif 18041 18042 #ifdef __LITTLE_ENDIAN__ 18043 __ai __attribute__((target("neon"))) uint8x16_t vmlsq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 18044 uint8x16_t __ret; 18045 __ret = __p0 - __p1 * __p2; 18046 return __ret; 18047 } 18048 #else 18049 __ai __attribute__((target("neon"))) uint8x16_t vmlsq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 18050 uint8x16_t __ret; 18051 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 
10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18052 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18053 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18054 __ret = __rev0 - __rev1 * __rev2; 18055 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18056 return __ret; 18057 } 18058 #endif 18059 18060 #ifdef __LITTLE_ENDIAN__ 18061 __ai __attribute__((target("neon"))) uint32x4_t vmlsq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 18062 uint32x4_t __ret; 18063 __ret = __p0 - __p1 * __p2; 18064 return __ret; 18065 } 18066 #else 18067 __ai __attribute__((target("neon"))) uint32x4_t vmlsq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 18068 uint32x4_t __ret; 18069 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18070 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18071 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 18072 __ret = __rev0 - __rev1 * __rev2; 18073 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18074 return __ret; 18075 } 18076 #endif 18077 18078 #ifdef __LITTLE_ENDIAN__ 18079 __ai __attribute__((target("neon"))) uint16x8_t vmlsq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 18080 uint16x8_t __ret; 18081 __ret = __p0 - __p1 * __p2; 18082 return __ret; 18083 } 18084 #else 18085 __ai __attribute__((target("neon"))) uint16x8_t vmlsq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 18086 uint16x8_t __ret; 18087 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 18088 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 18089 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 18090 __ret = __rev0 - __rev1 * __rev2; 18091 __ret = 
__builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18092 return __ret; 18093 } 18094 #endif 18095 18096 #ifdef __LITTLE_ENDIAN__ 18097 __ai __attribute__((target("neon"))) int8x16_t vmlsq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 18098 int8x16_t __ret; 18099 __ret = __p0 - __p1 * __p2; 18100 return __ret; 18101 } 18102 #else 18103 __ai __attribute__((target("neon"))) int8x16_t vmlsq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 18104 int8x16_t __ret; 18105 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18106 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18107 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18108 __ret = __rev0 - __rev1 * __rev2; 18109 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18110 return __ret; 18111 } 18112 #endif 18113 18114 #ifdef __LITTLE_ENDIAN__ 18115 __ai __attribute__((target("neon"))) float32x4_t vmlsq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 18116 float32x4_t __ret; 18117 __ret = __p0 - __p1 * __p2; 18118 return __ret; 18119 } 18120 #else 18121 __ai __attribute__((target("neon"))) float32x4_t vmlsq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 18122 float32x4_t __ret; 18123 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18124 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18125 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 18126 __ret = __rev0 - __rev1 * __rev2; 18127 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18128 return __ret; 18129 } 18130 #endif 18131 18132 #ifdef __LITTLE_ENDIAN__ 18133 __ai __attribute__((target("neon"))) int32x4_t vmlsq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 
18134 int32x4_t __ret; 18135 __ret = __p0 - __p1 * __p2; 18136 return __ret; 18137 } 18138 #else 18139 __ai __attribute__((target("neon"))) int32x4_t vmlsq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 18140 int32x4_t __ret; 18141 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18142 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18143 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 18144 __ret = __rev0 - __rev1 * __rev2; 18145 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18146 return __ret; 18147 } 18148 #endif 18149 18150 #ifdef __LITTLE_ENDIAN__ 18151 __ai __attribute__((target("neon"))) int16x8_t vmlsq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 18152 int16x8_t __ret; 18153 __ret = __p0 - __p1 * __p2; 18154 return __ret; 18155 } 18156 #else 18157 __ai __attribute__((target("neon"))) int16x8_t vmlsq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 18158 int16x8_t __ret; 18159 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 18160 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 18161 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 18162 __ret = __rev0 - __rev1 * __rev2; 18163 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18164 return __ret; 18165 } 18166 #endif 18167 18168 #ifdef __LITTLE_ENDIAN__ 18169 __ai __attribute__((target("neon"))) uint8x8_t vmls_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 18170 uint8x8_t __ret; 18171 __ret = __p0 - __p1 * __p2; 18172 return __ret; 18173 } 18174 #else 18175 __ai __attribute__((target("neon"))) uint8x8_t vmls_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 18176 uint8x8_t __ret; 18177 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 18178 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 
4, 3, 2, 1, 0); 18179 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 18180 __ret = __rev0 - __rev1 * __rev2; 18181 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18182 return __ret; 18183 } 18184 #endif 18185 18186 #ifdef __LITTLE_ENDIAN__ 18187 __ai __attribute__((target("neon"))) uint32x2_t vmls_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 18188 uint32x2_t __ret; 18189 __ret = __p0 - __p1 * __p2; 18190 return __ret; 18191 } 18192 #else 18193 __ai __attribute__((target("neon"))) uint32x2_t vmls_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 18194 uint32x2_t __ret; 18195 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 18196 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 18197 uint32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 18198 __ret = __rev0 - __rev1 * __rev2; 18199 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18200 return __ret; 18201 } 18202 #endif 18203 18204 #ifdef __LITTLE_ENDIAN__ 18205 __ai __attribute__((target("neon"))) uint16x4_t vmls_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 18206 uint16x4_t __ret; 18207 __ret = __p0 - __p1 * __p2; 18208 return __ret; 18209 } 18210 #else 18211 __ai __attribute__((target("neon"))) uint16x4_t vmls_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 18212 uint16x4_t __ret; 18213 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18214 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18215 uint16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 18216 __ret = __rev0 - __rev1 * __rev2; 18217 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18218 return __ret; 18219 } 18220 #endif 18221 18222 #ifdef __LITTLE_ENDIAN__ 18223 __ai __attribute__((target("neon"))) int8x8_t vmls_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 18224 int8x8_t __ret; 18225 __ret = 
__p0 - __p1 * __p2; 18226 return __ret; 18227 } 18228 #else 18229 __ai __attribute__((target("neon"))) int8x8_t vmls_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 18230 int8x8_t __ret; 18231 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 18232 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 18233 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 18234 __ret = __rev0 - __rev1 * __rev2; 18235 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18236 return __ret; 18237 } 18238 #endif 18239 18240 #ifdef __LITTLE_ENDIAN__ 18241 __ai __attribute__((target("neon"))) float32x2_t vmls_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 18242 float32x2_t __ret; 18243 __ret = __p0 - __p1 * __p2; 18244 return __ret; 18245 } 18246 #else 18247 __ai __attribute__((target("neon"))) float32x2_t vmls_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 18248 float32x2_t __ret; 18249 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 18250 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 18251 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 18252 __ret = __rev0 - __rev1 * __rev2; 18253 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18254 return __ret; 18255 } 18256 #endif 18257 18258 #ifdef __LITTLE_ENDIAN__ 18259 __ai __attribute__((target("neon"))) int32x2_t vmls_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 18260 int32x2_t __ret; 18261 __ret = __p0 - __p1 * __p2; 18262 return __ret; 18263 } 18264 #else 18265 __ai __attribute__((target("neon"))) int32x2_t vmls_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 18266 int32x2_t __ret; 18267 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 18268 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 18269 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, 
__p2, 1, 0); 18270 __ret = __rev0 - __rev1 * __rev2; 18271 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18272 return __ret; 18273 } 18274 #endif 18275 18276 #ifdef __LITTLE_ENDIAN__ 18277 __ai __attribute__((target("neon"))) int16x4_t vmls_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 18278 int16x4_t __ret; 18279 __ret = __p0 - __p1 * __p2; 18280 return __ret; 18281 } 18282 #else 18283 __ai __attribute__((target("neon"))) int16x4_t vmls_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 18284 int16x4_t __ret; 18285 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18286 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18287 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 18288 __ret = __rev0 - __rev1 * __rev2; 18289 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18290 return __ret; 18291 } 18292 #endif 18293 18294 #ifdef __LITTLE_ENDIAN__ 18295 #define vmlsq_lane_u32(__p0_74, __p1_74, __p2_74, __p3_74) __extension__ ({ \ 18296 uint32x4_t __ret_74; \ 18297 uint32x4_t __s0_74 = __p0_74; \ 18298 uint32x4_t __s1_74 = __p1_74; \ 18299 uint32x2_t __s2_74 = __p2_74; \ 18300 __ret_74 = __s0_74 - __s1_74 * splatq_lane_u32(__s2_74, __p3_74); \ 18301 __ret_74; \ 18302 }) 18303 #else 18304 #define vmlsq_lane_u32(__p0_75, __p1_75, __p2_75, __p3_75) __extension__ ({ \ 18305 uint32x4_t __ret_75; \ 18306 uint32x4_t __s0_75 = __p0_75; \ 18307 uint32x4_t __s1_75 = __p1_75; \ 18308 uint32x2_t __s2_75 = __p2_75; \ 18309 uint32x4_t __rev0_75; __rev0_75 = __builtin_shufflevector(__s0_75, __s0_75, 3, 2, 1, 0); \ 18310 uint32x4_t __rev1_75; __rev1_75 = __builtin_shufflevector(__s1_75, __s1_75, 3, 2, 1, 0); \ 18311 uint32x2_t __rev2_75; __rev2_75 = __builtin_shufflevector(__s2_75, __s2_75, 1, 0); \ 18312 __ret_75 = __rev0_75 - __rev1_75 * __noswap_splatq_lane_u32(__rev2_75, __p3_75); \ 18313 __ret_75 = __builtin_shufflevector(__ret_75, __ret_75, 3, 2, 1, 0); \ 18314 __ret_75; \ 
18315 }) 18316 #endif 18317 18318 #ifdef __LITTLE_ENDIAN__ 18319 #define vmlsq_lane_u16(__p0_76, __p1_76, __p2_76, __p3_76) __extension__ ({ \ 18320 uint16x8_t __ret_76; \ 18321 uint16x8_t __s0_76 = __p0_76; \ 18322 uint16x8_t __s1_76 = __p1_76; \ 18323 uint16x4_t __s2_76 = __p2_76; \ 18324 __ret_76 = __s0_76 - __s1_76 * splatq_lane_u16(__s2_76, __p3_76); \ 18325 __ret_76; \ 18326 }) 18327 #else 18328 #define vmlsq_lane_u16(__p0_77, __p1_77, __p2_77, __p3_77) __extension__ ({ \ 18329 uint16x8_t __ret_77; \ 18330 uint16x8_t __s0_77 = __p0_77; \ 18331 uint16x8_t __s1_77 = __p1_77; \ 18332 uint16x4_t __s2_77 = __p2_77; \ 18333 uint16x8_t __rev0_77; __rev0_77 = __builtin_shufflevector(__s0_77, __s0_77, 7, 6, 5, 4, 3, 2, 1, 0); \ 18334 uint16x8_t __rev1_77; __rev1_77 = __builtin_shufflevector(__s1_77, __s1_77, 7, 6, 5, 4, 3, 2, 1, 0); \ 18335 uint16x4_t __rev2_77; __rev2_77 = __builtin_shufflevector(__s2_77, __s2_77, 3, 2, 1, 0); \ 18336 __ret_77 = __rev0_77 - __rev1_77 * __noswap_splatq_lane_u16(__rev2_77, __p3_77); \ 18337 __ret_77 = __builtin_shufflevector(__ret_77, __ret_77, 7, 6, 5, 4, 3, 2, 1, 0); \ 18338 __ret_77; \ 18339 }) 18340 #endif 18341 18342 #ifdef __LITTLE_ENDIAN__ 18343 #define vmlsq_lane_f32(__p0_78, __p1_78, __p2_78, __p3_78) __extension__ ({ \ 18344 float32x4_t __ret_78; \ 18345 float32x4_t __s0_78 = __p0_78; \ 18346 float32x4_t __s1_78 = __p1_78; \ 18347 float32x2_t __s2_78 = __p2_78; \ 18348 __ret_78 = __s0_78 - __s1_78 * splatq_lane_f32(__s2_78, __p3_78); \ 18349 __ret_78; \ 18350 }) 18351 #else 18352 #define vmlsq_lane_f32(__p0_79, __p1_79, __p2_79, __p3_79) __extension__ ({ \ 18353 float32x4_t __ret_79; \ 18354 float32x4_t __s0_79 = __p0_79; \ 18355 float32x4_t __s1_79 = __p1_79; \ 18356 float32x2_t __s2_79 = __p2_79; \ 18357 float32x4_t __rev0_79; __rev0_79 = __builtin_shufflevector(__s0_79, __s0_79, 3, 2, 1, 0); \ 18358 float32x4_t __rev1_79; __rev1_79 = __builtin_shufflevector(__s1_79, __s1_79, 3, 2, 1, 0); \ 18359 float32x2_t __rev2_79; 
__rev2_79 = __builtin_shufflevector(__s2_79, __s2_79, 1, 0); \ 18360 __ret_79 = __rev0_79 - __rev1_79 * __noswap_splatq_lane_f32(__rev2_79, __p3_79); \ 18361 __ret_79 = __builtin_shufflevector(__ret_79, __ret_79, 3, 2, 1, 0); \ 18362 __ret_79; \ 18363 }) 18364 #endif 18365 18366 #ifdef __LITTLE_ENDIAN__ 18367 #define vmlsq_lane_s32(__p0_80, __p1_80, __p2_80, __p3_80) __extension__ ({ \ 18368 int32x4_t __ret_80; \ 18369 int32x4_t __s0_80 = __p0_80; \ 18370 int32x4_t __s1_80 = __p1_80; \ 18371 int32x2_t __s2_80 = __p2_80; \ 18372 __ret_80 = __s0_80 - __s1_80 * splatq_lane_s32(__s2_80, __p3_80); \ 18373 __ret_80; \ 18374 }) 18375 #else 18376 #define vmlsq_lane_s32(__p0_81, __p1_81, __p2_81, __p3_81) __extension__ ({ \ 18377 int32x4_t __ret_81; \ 18378 int32x4_t __s0_81 = __p0_81; \ 18379 int32x4_t __s1_81 = __p1_81; \ 18380 int32x2_t __s2_81 = __p2_81; \ 18381 int32x4_t __rev0_81; __rev0_81 = __builtin_shufflevector(__s0_81, __s0_81, 3, 2, 1, 0); \ 18382 int32x4_t __rev1_81; __rev1_81 = __builtin_shufflevector(__s1_81, __s1_81, 3, 2, 1, 0); \ 18383 int32x2_t __rev2_81; __rev2_81 = __builtin_shufflevector(__s2_81, __s2_81, 1, 0); \ 18384 __ret_81 = __rev0_81 - __rev1_81 * __noswap_splatq_lane_s32(__rev2_81, __p3_81); \ 18385 __ret_81 = __builtin_shufflevector(__ret_81, __ret_81, 3, 2, 1, 0); \ 18386 __ret_81; \ 18387 }) 18388 #endif 18389 18390 #ifdef __LITTLE_ENDIAN__ 18391 #define vmlsq_lane_s16(__p0_82, __p1_82, __p2_82, __p3_82) __extension__ ({ \ 18392 int16x8_t __ret_82; \ 18393 int16x8_t __s0_82 = __p0_82; \ 18394 int16x8_t __s1_82 = __p1_82; \ 18395 int16x4_t __s2_82 = __p2_82; \ 18396 __ret_82 = __s0_82 - __s1_82 * splatq_lane_s16(__s2_82, __p3_82); \ 18397 __ret_82; \ 18398 }) 18399 #else 18400 #define vmlsq_lane_s16(__p0_83, __p1_83, __p2_83, __p3_83) __extension__ ({ \ 18401 int16x8_t __ret_83; \ 18402 int16x8_t __s0_83 = __p0_83; \ 18403 int16x8_t __s1_83 = __p1_83; \ 18404 int16x4_t __s2_83 = __p2_83; \ 18405 int16x8_t __rev0_83; __rev0_83 = 
__builtin_shufflevector(__s0_83, __s0_83, 7, 6, 5, 4, 3, 2, 1, 0); \ 18406 int16x8_t __rev1_83; __rev1_83 = __builtin_shufflevector(__s1_83, __s1_83, 7, 6, 5, 4, 3, 2, 1, 0); \ 18407 int16x4_t __rev2_83; __rev2_83 = __builtin_shufflevector(__s2_83, __s2_83, 3, 2, 1, 0); \ 18408 __ret_83 = __rev0_83 - __rev1_83 * __noswap_splatq_lane_s16(__rev2_83, __p3_83); \ 18409 __ret_83 = __builtin_shufflevector(__ret_83, __ret_83, 7, 6, 5, 4, 3, 2, 1, 0); \ 18410 __ret_83; \ 18411 }) 18412 #endif 18413 18414 #ifdef __LITTLE_ENDIAN__ 18415 #define vmls_lane_u32(__p0_84, __p1_84, __p2_84, __p3_84) __extension__ ({ \ 18416 uint32x2_t __ret_84; \ 18417 uint32x2_t __s0_84 = __p0_84; \ 18418 uint32x2_t __s1_84 = __p1_84; \ 18419 uint32x2_t __s2_84 = __p2_84; \ 18420 __ret_84 = __s0_84 - __s1_84 * splat_lane_u32(__s2_84, __p3_84); \ 18421 __ret_84; \ 18422 }) 18423 #else 18424 #define vmls_lane_u32(__p0_85, __p1_85, __p2_85, __p3_85) __extension__ ({ \ 18425 uint32x2_t __ret_85; \ 18426 uint32x2_t __s0_85 = __p0_85; \ 18427 uint32x2_t __s1_85 = __p1_85; \ 18428 uint32x2_t __s2_85 = __p2_85; \ 18429 uint32x2_t __rev0_85; __rev0_85 = __builtin_shufflevector(__s0_85, __s0_85, 1, 0); \ 18430 uint32x2_t __rev1_85; __rev1_85 = __builtin_shufflevector(__s1_85, __s1_85, 1, 0); \ 18431 uint32x2_t __rev2_85; __rev2_85 = __builtin_shufflevector(__s2_85, __s2_85, 1, 0); \ 18432 __ret_85 = __rev0_85 - __rev1_85 * __noswap_splat_lane_u32(__rev2_85, __p3_85); \ 18433 __ret_85 = __builtin_shufflevector(__ret_85, __ret_85, 1, 0); \ 18434 __ret_85; \ 18435 }) 18436 #endif 18437 18438 #ifdef __LITTLE_ENDIAN__ 18439 #define vmls_lane_u16(__p0_86, __p1_86, __p2_86, __p3_86) __extension__ ({ \ 18440 uint16x4_t __ret_86; \ 18441 uint16x4_t __s0_86 = __p0_86; \ 18442 uint16x4_t __s1_86 = __p1_86; \ 18443 uint16x4_t __s2_86 = __p2_86; \ 18444 __ret_86 = __s0_86 - __s1_86 * splat_lane_u16(__s2_86, __p3_86); \ 18445 __ret_86; \ 18446 }) 18447 #else 18448 #define vmls_lane_u16(__p0_87, __p1_87, __p2_87, 
__p3_87) __extension__ ({ \ 18449 uint16x4_t __ret_87; \ 18450 uint16x4_t __s0_87 = __p0_87; \ 18451 uint16x4_t __s1_87 = __p1_87; \ 18452 uint16x4_t __s2_87 = __p2_87; \ 18453 uint16x4_t __rev0_87; __rev0_87 = __builtin_shufflevector(__s0_87, __s0_87, 3, 2, 1, 0); \ 18454 uint16x4_t __rev1_87; __rev1_87 = __builtin_shufflevector(__s1_87, __s1_87, 3, 2, 1, 0); \ 18455 uint16x4_t __rev2_87; __rev2_87 = __builtin_shufflevector(__s2_87, __s2_87, 3, 2, 1, 0); \ 18456 __ret_87 = __rev0_87 - __rev1_87 * __noswap_splat_lane_u16(__rev2_87, __p3_87); \ 18457 __ret_87 = __builtin_shufflevector(__ret_87, __ret_87, 3, 2, 1, 0); \ 18458 __ret_87; \ 18459 }) 18460 #endif 18461 18462 #ifdef __LITTLE_ENDIAN__ 18463 #define vmls_lane_f32(__p0_88, __p1_88, __p2_88, __p3_88) __extension__ ({ \ 18464 float32x2_t __ret_88; \ 18465 float32x2_t __s0_88 = __p0_88; \ 18466 float32x2_t __s1_88 = __p1_88; \ 18467 float32x2_t __s2_88 = __p2_88; \ 18468 __ret_88 = __s0_88 - __s1_88 * splat_lane_f32(__s2_88, __p3_88); \ 18469 __ret_88; \ 18470 }) 18471 #else 18472 #define vmls_lane_f32(__p0_89, __p1_89, __p2_89, __p3_89) __extension__ ({ \ 18473 float32x2_t __ret_89; \ 18474 float32x2_t __s0_89 = __p0_89; \ 18475 float32x2_t __s1_89 = __p1_89; \ 18476 float32x2_t __s2_89 = __p2_89; \ 18477 float32x2_t __rev0_89; __rev0_89 = __builtin_shufflevector(__s0_89, __s0_89, 1, 0); \ 18478 float32x2_t __rev1_89; __rev1_89 = __builtin_shufflevector(__s1_89, __s1_89, 1, 0); \ 18479 float32x2_t __rev2_89; __rev2_89 = __builtin_shufflevector(__s2_89, __s2_89, 1, 0); \ 18480 __ret_89 = __rev0_89 - __rev1_89 * __noswap_splat_lane_f32(__rev2_89, __p3_89); \ 18481 __ret_89 = __builtin_shufflevector(__ret_89, __ret_89, 1, 0); \ 18482 __ret_89; \ 18483 }) 18484 #endif 18485 18486 #ifdef __LITTLE_ENDIAN__ 18487 #define vmls_lane_s32(__p0_90, __p1_90, __p2_90, __p3_90) __extension__ ({ \ 18488 int32x2_t __ret_90; \ 18489 int32x2_t __s0_90 = __p0_90; \ 18490 int32x2_t __s1_90 = __p1_90; \ 18491 int32x2_t __s2_90 = 
__p2_90; \ 18492 __ret_90 = __s0_90 - __s1_90 * splat_lane_s32(__s2_90, __p3_90); \ 18493 __ret_90; \ 18494 }) 18495 #else 18496 #define vmls_lane_s32(__p0_91, __p1_91, __p2_91, __p3_91) __extension__ ({ \ 18497 int32x2_t __ret_91; \ 18498 int32x2_t __s0_91 = __p0_91; \ 18499 int32x2_t __s1_91 = __p1_91; \ 18500 int32x2_t __s2_91 = __p2_91; \ 18501 int32x2_t __rev0_91; __rev0_91 = __builtin_shufflevector(__s0_91, __s0_91, 1, 0); \ 18502 int32x2_t __rev1_91; __rev1_91 = __builtin_shufflevector(__s1_91, __s1_91, 1, 0); \ 18503 int32x2_t __rev2_91; __rev2_91 = __builtin_shufflevector(__s2_91, __s2_91, 1, 0); \ 18504 __ret_91 = __rev0_91 - __rev1_91 * __noswap_splat_lane_s32(__rev2_91, __p3_91); \ 18505 __ret_91 = __builtin_shufflevector(__ret_91, __ret_91, 1, 0); \ 18506 __ret_91; \ 18507 }) 18508 #endif 18509 18510 #ifdef __LITTLE_ENDIAN__ 18511 #define vmls_lane_s16(__p0_92, __p1_92, __p2_92, __p3_92) __extension__ ({ \ 18512 int16x4_t __ret_92; \ 18513 int16x4_t __s0_92 = __p0_92; \ 18514 int16x4_t __s1_92 = __p1_92; \ 18515 int16x4_t __s2_92 = __p2_92; \ 18516 __ret_92 = __s0_92 - __s1_92 * splat_lane_s16(__s2_92, __p3_92); \ 18517 __ret_92; \ 18518 }) 18519 #else 18520 #define vmls_lane_s16(__p0_93, __p1_93, __p2_93, __p3_93) __extension__ ({ \ 18521 int16x4_t __ret_93; \ 18522 int16x4_t __s0_93 = __p0_93; \ 18523 int16x4_t __s1_93 = __p1_93; \ 18524 int16x4_t __s2_93 = __p2_93; \ 18525 int16x4_t __rev0_93; __rev0_93 = __builtin_shufflevector(__s0_93, __s0_93, 3, 2, 1, 0); \ 18526 int16x4_t __rev1_93; __rev1_93 = __builtin_shufflevector(__s1_93, __s1_93, 3, 2, 1, 0); \ 18527 int16x4_t __rev2_93; __rev2_93 = __builtin_shufflevector(__s2_93, __s2_93, 3, 2, 1, 0); \ 18528 __ret_93 = __rev0_93 - __rev1_93 * __noswap_splat_lane_s16(__rev2_93, __p3_93); \ 18529 __ret_93 = __builtin_shufflevector(__ret_93, __ret_93, 3, 2, 1, 0); \ 18530 __ret_93; \ 18531 }) 18532 #endif 18533 18534 #ifdef __LITTLE_ENDIAN__ 18535 __ai __attribute__((target("neon"))) uint32x4_t 
vmlsq_n_u32(uint32x4_t __p0, uint32x4_t __p1, uint32_t __p2) { 18536 uint32x4_t __ret; 18537 __ret = __p0 - __p1 * (uint32x4_t) {__p2, __p2, __p2, __p2}; 18538 return __ret; 18539 } 18540 #else 18541 __ai __attribute__((target("neon"))) uint32x4_t vmlsq_n_u32(uint32x4_t __p0, uint32x4_t __p1, uint32_t __p2) { 18542 uint32x4_t __ret; 18543 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18544 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18545 __ret = __rev0 - __rev1 * (uint32x4_t) {__p2, __p2, __p2, __p2}; 18546 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18547 return __ret; 18548 } 18549 #endif 18550 18551 #ifdef __LITTLE_ENDIAN__ 18552 __ai __attribute__((target("neon"))) uint16x8_t vmlsq_n_u16(uint16x8_t __p0, uint16x8_t __p1, uint16_t __p2) { 18553 uint16x8_t __ret; 18554 __ret = __p0 - __p1 * (uint16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2}; 18555 return __ret; 18556 } 18557 #else 18558 __ai __attribute__((target("neon"))) uint16x8_t vmlsq_n_u16(uint16x8_t __p0, uint16x8_t __p1, uint16_t __p2) { 18559 uint16x8_t __ret; 18560 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 18561 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 18562 __ret = __rev0 - __rev1 * (uint16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2}; 18563 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18564 return __ret; 18565 } 18566 #endif 18567 18568 #ifdef __LITTLE_ENDIAN__ 18569 __ai __attribute__((target("neon"))) float32x4_t vmlsq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) { 18570 float32x4_t __ret; 18571 __ret = __p0 - __p1 * (float32x4_t) {__p2, __p2, __p2, __p2}; 18572 return __ret; 18573 } 18574 #else 18575 __ai __attribute__((target("neon"))) float32x4_t vmlsq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) { 18576 float32x4_t __ret; 18577 float32x4_t __rev0; 
__rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18578 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18579 __ret = __rev0 - __rev1 * (float32x4_t) {__p2, __p2, __p2, __p2}; 18580 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18581 return __ret; 18582 } 18583 #endif 18584 18585 #ifdef __LITTLE_ENDIAN__ 18586 __ai __attribute__((target("neon"))) int32x4_t vmlsq_n_s32(int32x4_t __p0, int32x4_t __p1, int32_t __p2) { 18587 int32x4_t __ret; 18588 __ret = __p0 - __p1 * (int32x4_t) {__p2, __p2, __p2, __p2}; 18589 return __ret; 18590 } 18591 #else 18592 __ai __attribute__((target("neon"))) int32x4_t vmlsq_n_s32(int32x4_t __p0, int32x4_t __p1, int32_t __p2) { 18593 int32x4_t __ret; 18594 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18595 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18596 __ret = __rev0 - __rev1 * (int32x4_t) {__p2, __p2, __p2, __p2}; 18597 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18598 return __ret; 18599 } 18600 #endif 18601 18602 #ifdef __LITTLE_ENDIAN__ 18603 __ai __attribute__((target("neon"))) int16x8_t vmlsq_n_s16(int16x8_t __p0, int16x8_t __p1, int16_t __p2) { 18604 int16x8_t __ret; 18605 __ret = __p0 - __p1 * (int16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2}; 18606 return __ret; 18607 } 18608 #else 18609 __ai __attribute__((target("neon"))) int16x8_t vmlsq_n_s16(int16x8_t __p0, int16x8_t __p1, int16_t __p2) { 18610 int16x8_t __ret; 18611 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 18612 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 18613 __ret = __rev0 - __rev1 * (int16x8_t) {__p2, __p2, __p2, __p2, __p2, __p2, __p2, __p2}; 18614 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18615 return __ret; 18616 } 18617 #endif 18618 18619 #ifdef __LITTLE_ENDIAN__ 18620 __ai __attribute__((target("neon"))) 
uint32x2_t vmls_n_u32(uint32x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 18621 uint32x2_t __ret; 18622 __ret = __p0 - __p1 * (uint32x2_t) {__p2, __p2}; 18623 return __ret; 18624 } 18625 #else 18626 __ai __attribute__((target("neon"))) uint32x2_t vmls_n_u32(uint32x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 18627 uint32x2_t __ret; 18628 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 18629 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 18630 __ret = __rev0 - __rev1 * (uint32x2_t) {__p2, __p2}; 18631 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18632 return __ret; 18633 } 18634 #endif 18635 18636 #ifdef __LITTLE_ENDIAN__ 18637 __ai __attribute__((target("neon"))) uint16x4_t vmls_n_u16(uint16x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 18638 uint16x4_t __ret; 18639 __ret = __p0 - __p1 * (uint16x4_t) {__p2, __p2, __p2, __p2}; 18640 return __ret; 18641 } 18642 #else 18643 __ai __attribute__((target("neon"))) uint16x4_t vmls_n_u16(uint16x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 18644 uint16x4_t __ret; 18645 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18646 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18647 __ret = __rev0 - __rev1 * (uint16x4_t) {__p2, __p2, __p2, __p2}; 18648 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18649 return __ret; 18650 } 18651 #endif 18652 18653 #ifdef __LITTLE_ENDIAN__ 18654 __ai __attribute__((target("neon"))) float32x2_t vmls_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) { 18655 float32x2_t __ret; 18656 __ret = __p0 - __p1 * (float32x2_t) {__p2, __p2}; 18657 return __ret; 18658 } 18659 #else 18660 __ai __attribute__((target("neon"))) float32x2_t vmls_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) { 18661 float32x2_t __ret; 18662 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 18663 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 18664 
__ret = __rev0 - __rev1 * (float32x2_t) {__p2, __p2}; 18665 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18666 return __ret; 18667 } 18668 #endif 18669 18670 #ifdef __LITTLE_ENDIAN__ 18671 __ai __attribute__((target("neon"))) int32x2_t vmls_n_s32(int32x2_t __p0, int32x2_t __p1, int32_t __p2) { 18672 int32x2_t __ret; 18673 __ret = __p0 - __p1 * (int32x2_t) {__p2, __p2}; 18674 return __ret; 18675 } 18676 #else 18677 __ai __attribute__((target("neon"))) int32x2_t vmls_n_s32(int32x2_t __p0, int32x2_t __p1, int32_t __p2) { 18678 int32x2_t __ret; 18679 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 18680 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 18681 __ret = __rev0 - __rev1 * (int32x2_t) {__p2, __p2}; 18682 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18683 return __ret; 18684 } 18685 #endif 18686 18687 #ifdef __LITTLE_ENDIAN__ 18688 __ai __attribute__((target("neon"))) int16x4_t vmls_n_s16(int16x4_t __p0, int16x4_t __p1, int16_t __p2) { 18689 int16x4_t __ret; 18690 __ret = __p0 - __p1 * (int16x4_t) {__p2, __p2, __p2, __p2}; 18691 return __ret; 18692 } 18693 #else 18694 __ai __attribute__((target("neon"))) int16x4_t vmls_n_s16(int16x4_t __p0, int16x4_t __p1, int16_t __p2) { 18695 int16x4_t __ret; 18696 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 18697 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 18698 __ret = __rev0 - __rev1 * (int16x4_t) {__p2, __p2, __p2, __p2}; 18699 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18700 return __ret; 18701 } 18702 #endif 18703 18704 #ifdef __LITTLE_ENDIAN__ 18705 __ai __attribute__((target("neon"))) poly8x8_t vmov_n_p8(poly8_t __p0) { 18706 poly8x8_t __ret; 18707 __ret = (poly8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18708 return __ret; 18709 } 18710 #else 18711 __ai __attribute__((target("neon"))) poly8x8_t vmov_n_p8(poly8_t __p0) { 18712 poly8x8_t __ret; 18713 __ret = 
(poly8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18714 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18715 return __ret; 18716 } 18717 #endif 18718 18719 #ifdef __LITTLE_ENDIAN__ 18720 __ai __attribute__((target("neon"))) poly16x4_t vmov_n_p16(poly16_t __p0) { 18721 poly16x4_t __ret; 18722 __ret = (poly16x4_t) {__p0, __p0, __p0, __p0}; 18723 return __ret; 18724 } 18725 #else 18726 __ai __attribute__((target("neon"))) poly16x4_t vmov_n_p16(poly16_t __p0) { 18727 poly16x4_t __ret; 18728 __ret = (poly16x4_t) {__p0, __p0, __p0, __p0}; 18729 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18730 return __ret; 18731 } 18732 #endif 18733 18734 #ifdef __LITTLE_ENDIAN__ 18735 __ai __attribute__((target("neon"))) poly8x16_t vmovq_n_p8(poly8_t __p0) { 18736 poly8x16_t __ret; 18737 __ret = (poly8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18738 return __ret; 18739 } 18740 #else 18741 __ai __attribute__((target("neon"))) poly8x16_t vmovq_n_p8(poly8_t __p0) { 18742 poly8x16_t __ret; 18743 __ret = (poly8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18744 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18745 return __ret; 18746 } 18747 #endif 18748 18749 #ifdef __LITTLE_ENDIAN__ 18750 __ai __attribute__((target("neon"))) poly16x8_t vmovq_n_p16(poly16_t __p0) { 18751 poly16x8_t __ret; 18752 __ret = (poly16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18753 return __ret; 18754 } 18755 #else 18756 __ai __attribute__((target("neon"))) poly16x8_t vmovq_n_p16(poly16_t __p0) { 18757 poly16x8_t __ret; 18758 __ret = (poly16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18759 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18760 return __ret; 18761 } 18762 #endif 18763 18764 #ifdef __LITTLE_ENDIAN__ 18765 __ai 
__attribute__((target("neon"))) uint8x16_t vmovq_n_u8(uint8_t __p0) { 18766 uint8x16_t __ret; 18767 __ret = (uint8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18768 return __ret; 18769 } 18770 #else 18771 __ai __attribute__((target("neon"))) uint8x16_t vmovq_n_u8(uint8_t __p0) { 18772 uint8x16_t __ret; 18773 __ret = (uint8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18774 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18775 return __ret; 18776 } 18777 #endif 18778 18779 #ifdef __LITTLE_ENDIAN__ 18780 __ai __attribute__((target("neon"))) uint32x4_t vmovq_n_u32(uint32_t __p0) { 18781 uint32x4_t __ret; 18782 __ret = (uint32x4_t) {__p0, __p0, __p0, __p0}; 18783 return __ret; 18784 } 18785 #else 18786 __ai __attribute__((target("neon"))) uint32x4_t vmovq_n_u32(uint32_t __p0) { 18787 uint32x4_t __ret; 18788 __ret = (uint32x4_t) {__p0, __p0, __p0, __p0}; 18789 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18790 return __ret; 18791 } 18792 #endif 18793 18794 #ifdef __LITTLE_ENDIAN__ 18795 __ai __attribute__((target("neon"))) uint64x2_t vmovq_n_u64(uint64_t __p0) { 18796 uint64x2_t __ret; 18797 __ret = (uint64x2_t) {__p0, __p0}; 18798 return __ret; 18799 } 18800 #else 18801 __ai __attribute__((target("neon"))) uint64x2_t vmovq_n_u64(uint64_t __p0) { 18802 uint64x2_t __ret; 18803 __ret = (uint64x2_t) {__p0, __p0}; 18804 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18805 return __ret; 18806 } 18807 #endif 18808 18809 #ifdef __LITTLE_ENDIAN__ 18810 __ai __attribute__((target("neon"))) uint16x8_t vmovq_n_u16(uint16_t __p0) { 18811 uint16x8_t __ret; 18812 __ret = (uint16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18813 return __ret; 18814 } 18815 #else 18816 __ai __attribute__((target("neon"))) uint16x8_t vmovq_n_u16(uint16_t __p0) { 18817 uint16x8_t __ret; 18818 __ret = 
(uint16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18819 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18820 return __ret; 18821 } 18822 #endif 18823 18824 #ifdef __LITTLE_ENDIAN__ 18825 __ai __attribute__((target("neon"))) int8x16_t vmovq_n_s8(int8_t __p0) { 18826 int8x16_t __ret; 18827 __ret = (int8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18828 return __ret; 18829 } 18830 #else 18831 __ai __attribute__((target("neon"))) int8x16_t vmovq_n_s8(int8_t __p0) { 18832 int8x16_t __ret; 18833 __ret = (int8x16_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18834 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 18835 return __ret; 18836 } 18837 #endif 18838 18839 #ifdef __LITTLE_ENDIAN__ 18840 __ai __attribute__((target("neon"))) float32x4_t vmovq_n_f32(float32_t __p0) { 18841 float32x4_t __ret; 18842 __ret = (float32x4_t) {__p0, __p0, __p0, __p0}; 18843 return __ret; 18844 } 18845 #else 18846 __ai __attribute__((target("neon"))) float32x4_t vmovq_n_f32(float32_t __p0) { 18847 float32x4_t __ret; 18848 __ret = (float32x4_t) {__p0, __p0, __p0, __p0}; 18849 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18850 return __ret; 18851 } 18852 #endif 18853 18854 #ifdef __LITTLE_ENDIAN__ 18855 #define vmovq_n_f16(__p0) __extension__ ({ \ 18856 float16x8_t __ret; \ 18857 float16_t __s0 = __p0; \ 18858 __ret = (float16x8_t) {__s0, __s0, __s0, __s0, __s0, __s0, __s0, __s0}; \ 18859 __ret; \ 18860 }) 18861 #else 18862 #define vmovq_n_f16(__p0) __extension__ ({ \ 18863 float16x8_t __ret; \ 18864 float16_t __s0 = __p0; \ 18865 __ret = (float16x8_t) {__s0, __s0, __s0, __s0, __s0, __s0, __s0, __s0}; \ 18866 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 18867 __ret; \ 18868 }) 18869 #endif 18870 18871 #ifdef __LITTLE_ENDIAN__ 18872 __ai 
__attribute__((target("neon"))) int32x4_t vmovq_n_s32(int32_t __p0) { 18873 int32x4_t __ret; 18874 __ret = (int32x4_t) {__p0, __p0, __p0, __p0}; 18875 return __ret; 18876 } 18877 #else 18878 __ai __attribute__((target("neon"))) int32x4_t vmovq_n_s32(int32_t __p0) { 18879 int32x4_t __ret; 18880 __ret = (int32x4_t) {__p0, __p0, __p0, __p0}; 18881 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18882 return __ret; 18883 } 18884 #endif 18885 18886 #ifdef __LITTLE_ENDIAN__ 18887 __ai __attribute__((target("neon"))) int64x2_t vmovq_n_s64(int64_t __p0) { 18888 int64x2_t __ret; 18889 __ret = (int64x2_t) {__p0, __p0}; 18890 return __ret; 18891 } 18892 #else 18893 __ai __attribute__((target("neon"))) int64x2_t vmovq_n_s64(int64_t __p0) { 18894 int64x2_t __ret; 18895 __ret = (int64x2_t) {__p0, __p0}; 18896 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18897 return __ret; 18898 } 18899 #endif 18900 18901 #ifdef __LITTLE_ENDIAN__ 18902 __ai __attribute__((target("neon"))) int16x8_t vmovq_n_s16(int16_t __p0) { 18903 int16x8_t __ret; 18904 __ret = (int16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18905 return __ret; 18906 } 18907 #else 18908 __ai __attribute__((target("neon"))) int16x8_t vmovq_n_s16(int16_t __p0) { 18909 int16x8_t __ret; 18910 __ret = (int16x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18911 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18912 return __ret; 18913 } 18914 #endif 18915 18916 #ifdef __LITTLE_ENDIAN__ 18917 __ai __attribute__((target("neon"))) uint8x8_t vmov_n_u8(uint8_t __p0) { 18918 uint8x8_t __ret; 18919 __ret = (uint8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18920 return __ret; 18921 } 18922 #else 18923 __ai __attribute__((target("neon"))) uint8x8_t vmov_n_u8(uint8_t __p0) { 18924 uint8x8_t __ret; 18925 __ret = (uint8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18926 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18927 return __ret; 
18928 } 18929 #endif 18930 18931 #ifdef __LITTLE_ENDIAN__ 18932 __ai __attribute__((target("neon"))) uint32x2_t vmov_n_u32(uint32_t __p0) { 18933 uint32x2_t __ret; 18934 __ret = (uint32x2_t) {__p0, __p0}; 18935 return __ret; 18936 } 18937 #else 18938 __ai __attribute__((target("neon"))) uint32x2_t vmov_n_u32(uint32_t __p0) { 18939 uint32x2_t __ret; 18940 __ret = (uint32x2_t) {__p0, __p0}; 18941 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18942 return __ret; 18943 } 18944 #endif 18945 18946 __ai __attribute__((target("neon"))) uint64x1_t vmov_n_u64(uint64_t __p0) { 18947 uint64x1_t __ret; 18948 __ret = (uint64x1_t) {__p0}; 18949 return __ret; 18950 } 18951 #ifdef __LITTLE_ENDIAN__ 18952 __ai __attribute__((target("neon"))) uint16x4_t vmov_n_u16(uint16_t __p0) { 18953 uint16x4_t __ret; 18954 __ret = (uint16x4_t) {__p0, __p0, __p0, __p0}; 18955 return __ret; 18956 } 18957 #else 18958 __ai __attribute__((target("neon"))) uint16x4_t vmov_n_u16(uint16_t __p0) { 18959 uint16x4_t __ret; 18960 __ret = (uint16x4_t) {__p0, __p0, __p0, __p0}; 18961 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 18962 return __ret; 18963 } 18964 #endif 18965 18966 #ifdef __LITTLE_ENDIAN__ 18967 __ai __attribute__((target("neon"))) int8x8_t vmov_n_s8(int8_t __p0) { 18968 int8x8_t __ret; 18969 __ret = (int8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18970 return __ret; 18971 } 18972 #else 18973 __ai __attribute__((target("neon"))) int8x8_t vmov_n_s8(int8_t __p0) { 18974 int8x8_t __ret; 18975 __ret = (int8x8_t) {__p0, __p0, __p0, __p0, __p0, __p0, __p0, __p0}; 18976 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 18977 return __ret; 18978 } 18979 #endif 18980 18981 #ifdef __LITTLE_ENDIAN__ 18982 __ai __attribute__((target("neon"))) float32x2_t vmov_n_f32(float32_t __p0) { 18983 float32x2_t __ret; 18984 __ret = (float32x2_t) {__p0, __p0}; 18985 return __ret; 18986 } 18987 #else 18988 __ai __attribute__((target("neon"))) float32x2_t 
vmov_n_f32(float32_t __p0) { 18989 float32x2_t __ret; 18990 __ret = (float32x2_t) {__p0, __p0}; 18991 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 18992 return __ret; 18993 } 18994 #endif 18995 18996 #ifdef __LITTLE_ENDIAN__ 18997 #define vmov_n_f16(__p0) __extension__ ({ \ 18998 float16x4_t __ret; \ 18999 float16_t __s0 = __p0; \ 19000 __ret = (float16x4_t) {__s0, __s0, __s0, __s0}; \ 19001 __ret; \ 19002 }) 19003 #else 19004 #define vmov_n_f16(__p0) __extension__ ({ \ 19005 float16x4_t __ret; \ 19006 float16_t __s0 = __p0; \ 19007 __ret = (float16x4_t) {__s0, __s0, __s0, __s0}; \ 19008 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 19009 __ret; \ 19010 }) 19011 #endif 19012 19013 #ifdef __LITTLE_ENDIAN__ 19014 __ai __attribute__((target("neon"))) int32x2_t vmov_n_s32(int32_t __p0) { 19015 int32x2_t __ret; 19016 __ret = (int32x2_t) {__p0, __p0}; 19017 return __ret; 19018 } 19019 #else 19020 __ai __attribute__((target("neon"))) int32x2_t vmov_n_s32(int32_t __p0) { 19021 int32x2_t __ret; 19022 __ret = (int32x2_t) {__p0, __p0}; 19023 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19024 return __ret; 19025 } 19026 #endif 19027 19028 __ai __attribute__((target("neon"))) int64x1_t vmov_n_s64(int64_t __p0) { 19029 int64x1_t __ret; 19030 __ret = (int64x1_t) {__p0}; 19031 return __ret; 19032 } 19033 #ifdef __LITTLE_ENDIAN__ 19034 __ai __attribute__((target("neon"))) int16x4_t vmov_n_s16(int16_t __p0) { 19035 int16x4_t __ret; 19036 __ret = (int16x4_t) {__p0, __p0, __p0, __p0}; 19037 return __ret; 19038 } 19039 #else 19040 __ai __attribute__((target("neon"))) int16x4_t vmov_n_s16(int16_t __p0) { 19041 int16x4_t __ret; 19042 __ret = (int16x4_t) {__p0, __p0, __p0, __p0}; 19043 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19044 return __ret; 19045 } 19046 #endif 19047 19048 #ifdef __LITTLE_ENDIAN__ 19049 __ai __attribute__((target("neon"))) uint16x8_t vmovl_u8(uint8x8_t __p0) { 19050 uint16x8_t __ret; 19051 __ret = (uint16x8_t) 
__builtin_neon_vmovl_v((int8x8_t)__p0, 49); 19052 return __ret; 19053 } 19054 #else 19055 __ai __attribute__((target("neon"))) uint16x8_t vmovl_u8(uint8x8_t __p0) { 19056 uint16x8_t __ret; 19057 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19058 __ret = (uint16x8_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 49); 19059 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19060 return __ret; 19061 } 19062 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmovl_u8(uint8x8_t __p0) { 19063 uint16x8_t __ret; 19064 __ret = (uint16x8_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 49); 19065 return __ret; 19066 } 19067 #endif 19068 19069 #ifdef __LITTLE_ENDIAN__ 19070 __ai __attribute__((target("neon"))) uint64x2_t vmovl_u32(uint32x2_t __p0) { 19071 uint64x2_t __ret; 19072 __ret = (uint64x2_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 51); 19073 return __ret; 19074 } 19075 #else 19076 __ai __attribute__((target("neon"))) uint64x2_t vmovl_u32(uint32x2_t __p0) { 19077 uint64x2_t __ret; 19078 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19079 __ret = (uint64x2_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 51); 19080 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19081 return __ret; 19082 } 19083 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmovl_u32(uint32x2_t __p0) { 19084 uint64x2_t __ret; 19085 __ret = (uint64x2_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 51); 19086 return __ret; 19087 } 19088 #endif 19089 19090 #ifdef __LITTLE_ENDIAN__ 19091 __ai __attribute__((target("neon"))) uint32x4_t vmovl_u16(uint16x4_t __p0) { 19092 uint32x4_t __ret; 19093 __ret = (uint32x4_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 50); 19094 return __ret; 19095 } 19096 #else 19097 __ai __attribute__((target("neon"))) uint32x4_t vmovl_u16(uint16x4_t __p0) { 19098 uint32x4_t __ret; 19099 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19100 __ret = (uint32x4_t) 
__builtin_neon_vmovl_v((int8x8_t)__rev0, 50); 19101 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19102 return __ret; 19103 } 19104 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmovl_u16(uint16x4_t __p0) { 19105 uint32x4_t __ret; 19106 __ret = (uint32x4_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 50); 19107 return __ret; 19108 } 19109 #endif 19110 19111 #ifdef __LITTLE_ENDIAN__ 19112 __ai __attribute__((target("neon"))) int16x8_t vmovl_s8(int8x8_t __p0) { 19113 int16x8_t __ret; 19114 __ret = (int16x8_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 33); 19115 return __ret; 19116 } 19117 #else 19118 __ai __attribute__((target("neon"))) int16x8_t vmovl_s8(int8x8_t __p0) { 19119 int16x8_t __ret; 19120 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19121 __ret = (int16x8_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 33); 19122 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19123 return __ret; 19124 } 19125 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmovl_s8(int8x8_t __p0) { 19126 int16x8_t __ret; 19127 __ret = (int16x8_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 33); 19128 return __ret; 19129 } 19130 #endif 19131 19132 #ifdef __LITTLE_ENDIAN__ 19133 __ai __attribute__((target("neon"))) int64x2_t vmovl_s32(int32x2_t __p0) { 19134 int64x2_t __ret; 19135 __ret = (int64x2_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 35); 19136 return __ret; 19137 } 19138 #else 19139 __ai __attribute__((target("neon"))) int64x2_t vmovl_s32(int32x2_t __p0) { 19140 int64x2_t __ret; 19141 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19142 __ret = (int64x2_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 35); 19143 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19144 return __ret; 19145 } 19146 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmovl_s32(int32x2_t __p0) { 19147 int64x2_t __ret; 19148 __ret = (int64x2_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 35); 19149 return 
__ret; 19150 } 19151 #endif 19152 19153 #ifdef __LITTLE_ENDIAN__ 19154 __ai __attribute__((target("neon"))) int32x4_t vmovl_s16(int16x4_t __p0) { 19155 int32x4_t __ret; 19156 __ret = (int32x4_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 34); 19157 return __ret; 19158 } 19159 #else 19160 __ai __attribute__((target("neon"))) int32x4_t vmovl_s16(int16x4_t __p0) { 19161 int32x4_t __ret; 19162 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19163 __ret = (int32x4_t) __builtin_neon_vmovl_v((int8x8_t)__rev0, 34); 19164 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19165 return __ret; 19166 } 19167 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmovl_s16(int16x4_t __p0) { 19168 int32x4_t __ret; 19169 __ret = (int32x4_t) __builtin_neon_vmovl_v((int8x8_t)__p0, 34); 19170 return __ret; 19171 } 19172 #endif 19173 19174 #ifdef __LITTLE_ENDIAN__ 19175 __ai __attribute__((target("neon"))) uint16x4_t vmovn_u32(uint32x4_t __p0) { 19176 uint16x4_t __ret; 19177 __ret = (uint16x4_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 17); 19178 return __ret; 19179 } 19180 #else 19181 __ai __attribute__((target("neon"))) uint16x4_t vmovn_u32(uint32x4_t __p0) { 19182 uint16x4_t __ret; 19183 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19184 __ret = (uint16x4_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 17); 19185 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19186 return __ret; 19187 } 19188 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vmovn_u32(uint32x4_t __p0) { 19189 uint16x4_t __ret; 19190 __ret = (uint16x4_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 17); 19191 return __ret; 19192 } 19193 #endif 19194 19195 #ifdef __LITTLE_ENDIAN__ 19196 __ai __attribute__((target("neon"))) uint32x2_t vmovn_u64(uint64x2_t __p0) { 19197 uint32x2_t __ret; 19198 __ret = (uint32x2_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 18); 19199 return __ret; 19200 } 19201 #else 19202 __ai __attribute__((target("neon"))) 
uint32x2_t vmovn_u64(uint64x2_t __p0) { 19203 uint32x2_t __ret; 19204 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19205 __ret = (uint32x2_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 18); 19206 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19207 return __ret; 19208 } 19209 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vmovn_u64(uint64x2_t __p0) { 19210 uint32x2_t __ret; 19211 __ret = (uint32x2_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 18); 19212 return __ret; 19213 } 19214 #endif 19215 19216 #ifdef __LITTLE_ENDIAN__ 19217 __ai __attribute__((target("neon"))) uint8x8_t vmovn_u16(uint16x8_t __p0) { 19218 uint8x8_t __ret; 19219 __ret = (uint8x8_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 16); 19220 return __ret; 19221 } 19222 #else 19223 __ai __attribute__((target("neon"))) uint8x8_t vmovn_u16(uint16x8_t __p0) { 19224 uint8x8_t __ret; 19225 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19226 __ret = (uint8x8_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 16); 19227 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19228 return __ret; 19229 } 19230 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vmovn_u16(uint16x8_t __p0) { 19231 uint8x8_t __ret; 19232 __ret = (uint8x8_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 16); 19233 return __ret; 19234 } 19235 #endif 19236 19237 #ifdef __LITTLE_ENDIAN__ 19238 __ai __attribute__((target("neon"))) int16x4_t vmovn_s32(int32x4_t __p0) { 19239 int16x4_t __ret; 19240 __ret = (int16x4_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 1); 19241 return __ret; 19242 } 19243 #else 19244 __ai __attribute__((target("neon"))) int16x4_t vmovn_s32(int32x4_t __p0) { 19245 int16x4_t __ret; 19246 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19247 __ret = (int16x4_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 1); 19248 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19249 return __ret; 19250 } 19251 
__ai __attribute__((target("neon"))) int16x4_t __noswap_vmovn_s32(int32x4_t __p0) { 19252 int16x4_t __ret; 19253 __ret = (int16x4_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 1); 19254 return __ret; 19255 } 19256 #endif 19257 19258 #ifdef __LITTLE_ENDIAN__ 19259 __ai __attribute__((target("neon"))) int32x2_t vmovn_s64(int64x2_t __p0) { 19260 int32x2_t __ret; 19261 __ret = (int32x2_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 2); 19262 return __ret; 19263 } 19264 #else 19265 __ai __attribute__((target("neon"))) int32x2_t vmovn_s64(int64x2_t __p0) { 19266 int32x2_t __ret; 19267 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19268 __ret = (int32x2_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 2); 19269 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19270 return __ret; 19271 } 19272 __ai __attribute__((target("neon"))) int32x2_t __noswap_vmovn_s64(int64x2_t __p0) { 19273 int32x2_t __ret; 19274 __ret = (int32x2_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 2); 19275 return __ret; 19276 } 19277 #endif 19278 19279 #ifdef __LITTLE_ENDIAN__ 19280 __ai __attribute__((target("neon"))) int8x8_t vmovn_s16(int16x8_t __p0) { 19281 int8x8_t __ret; 19282 __ret = (int8x8_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 0); 19283 return __ret; 19284 } 19285 #else 19286 __ai __attribute__((target("neon"))) int8x8_t vmovn_s16(int16x8_t __p0) { 19287 int8x8_t __ret; 19288 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19289 __ret = (int8x8_t) __builtin_neon_vmovn_v((int8x16_t)__rev0, 0); 19290 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19291 return __ret; 19292 } 19293 __ai __attribute__((target("neon"))) int8x8_t __noswap_vmovn_s16(int16x8_t __p0) { 19294 int8x8_t __ret; 19295 __ret = (int8x8_t) __builtin_neon_vmovn_v((int8x16_t)__p0, 0); 19296 return __ret; 19297 } 19298 #endif 19299 19300 #ifdef __LITTLE_ENDIAN__ 19301 __ai __attribute__((target("neon"))) uint8x16_t vmulq_u8(uint8x16_t __p0, 
uint8x16_t __p1) { 19302 uint8x16_t __ret; 19303 __ret = __p0 * __p1; 19304 return __ret; 19305 } 19306 #else 19307 __ai __attribute__((target("neon"))) uint8x16_t vmulq_u8(uint8x16_t __p0, uint8x16_t __p1) { 19308 uint8x16_t __ret; 19309 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19310 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19311 __ret = __rev0 * __rev1; 19312 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19313 return __ret; 19314 } 19315 #endif 19316 19317 #ifdef __LITTLE_ENDIAN__ 19318 __ai __attribute__((target("neon"))) uint32x4_t vmulq_u32(uint32x4_t __p0, uint32x4_t __p1) { 19319 uint32x4_t __ret; 19320 __ret = __p0 * __p1; 19321 return __ret; 19322 } 19323 #else 19324 __ai __attribute__((target("neon"))) uint32x4_t vmulq_u32(uint32x4_t __p0, uint32x4_t __p1) { 19325 uint32x4_t __ret; 19326 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19327 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 19328 __ret = __rev0 * __rev1; 19329 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19330 return __ret; 19331 } 19332 #endif 19333 19334 #ifdef __LITTLE_ENDIAN__ 19335 __ai __attribute__((target("neon"))) uint16x8_t vmulq_u16(uint16x8_t __p0, uint16x8_t __p1) { 19336 uint16x8_t __ret; 19337 __ret = __p0 * __p1; 19338 return __ret; 19339 } 19340 #else 19341 __ai __attribute__((target("neon"))) uint16x8_t vmulq_u16(uint16x8_t __p0, uint16x8_t __p1) { 19342 uint16x8_t __ret; 19343 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19344 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 19345 __ret = __rev0 * __rev1; 19346 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19347 return __ret; 19348 } 
19349 #endif 19350 19351 #ifdef __LITTLE_ENDIAN__ 19352 __ai __attribute__((target("neon"))) int8x16_t vmulq_s8(int8x16_t __p0, int8x16_t __p1) { 19353 int8x16_t __ret; 19354 __ret = __p0 * __p1; 19355 return __ret; 19356 } 19357 #else 19358 __ai __attribute__((target("neon"))) int8x16_t vmulq_s8(int8x16_t __p0, int8x16_t __p1) { 19359 int8x16_t __ret; 19360 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19361 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19362 __ret = __rev0 * __rev1; 19363 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19364 return __ret; 19365 } 19366 #endif 19367 19368 #ifdef __LITTLE_ENDIAN__ 19369 __ai __attribute__((target("neon"))) float32x4_t vmulq_f32(float32x4_t __p0, float32x4_t __p1) { 19370 float32x4_t __ret; 19371 __ret = __p0 * __p1; 19372 return __ret; 19373 } 19374 #else 19375 __ai __attribute__((target("neon"))) float32x4_t vmulq_f32(float32x4_t __p0, float32x4_t __p1) { 19376 float32x4_t __ret; 19377 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19378 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 19379 __ret = __rev0 * __rev1; 19380 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19381 return __ret; 19382 } 19383 #endif 19384 19385 #ifdef __LITTLE_ENDIAN__ 19386 __ai __attribute__((target("neon"))) int32x4_t vmulq_s32(int32x4_t __p0, int32x4_t __p1) { 19387 int32x4_t __ret; 19388 __ret = __p0 * __p1; 19389 return __ret; 19390 } 19391 #else 19392 __ai __attribute__((target("neon"))) int32x4_t vmulq_s32(int32x4_t __p0, int32x4_t __p1) { 19393 int32x4_t __ret; 19394 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19395 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 19396 __ret = __rev0 * __rev1; 19397 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19398 return __ret; 19399 } 19400 #endif 19401 19402 #ifdef __LITTLE_ENDIAN__ 19403 __ai __attribute__((target("neon"))) int16x8_t vmulq_s16(int16x8_t __p0, int16x8_t __p1) { 19404 int16x8_t __ret; 19405 __ret = __p0 * __p1; 19406 return __ret; 19407 } 19408 #else 19409 __ai __attribute__((target("neon"))) int16x8_t vmulq_s16(int16x8_t __p0, int16x8_t __p1) { 19410 int16x8_t __ret; 19411 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19412 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 19413 __ret = __rev0 * __rev1; 19414 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19415 return __ret; 19416 } 19417 #endif 19418 19419 #ifdef __LITTLE_ENDIAN__ 19420 __ai __attribute__((target("neon"))) uint8x8_t vmul_u8(uint8x8_t __p0, uint8x8_t __p1) { 19421 uint8x8_t __ret; 19422 __ret = __p0 * __p1; 19423 return __ret; 19424 } 19425 #else 19426 __ai __attribute__((target("neon"))) uint8x8_t vmul_u8(uint8x8_t __p0, uint8x8_t __p1) { 19427 uint8x8_t __ret; 19428 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19429 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 19430 __ret = __rev0 * __rev1; 19431 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19432 return __ret; 19433 } 19434 #endif 19435 19436 #ifdef __LITTLE_ENDIAN__ 19437 __ai __attribute__((target("neon"))) uint32x2_t vmul_u32(uint32x2_t __p0, uint32x2_t __p1) { 19438 uint32x2_t __ret; 19439 __ret = __p0 * __p1; 19440 return __ret; 19441 } 19442 #else 19443 __ai __attribute__((target("neon"))) uint32x2_t vmul_u32(uint32x2_t __p0, uint32x2_t __p1) { 19444 uint32x2_t __ret; 19445 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19446 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 19447 __ret = __rev0 * __rev1; 19448 __ret = 
__builtin_shufflevector(__ret, __ret, 1, 0); 19449 return __ret; 19450 } 19451 #endif 19452 19453 #ifdef __LITTLE_ENDIAN__ 19454 __ai __attribute__((target("neon"))) uint16x4_t vmul_u16(uint16x4_t __p0, uint16x4_t __p1) { 19455 uint16x4_t __ret; 19456 __ret = __p0 * __p1; 19457 return __ret; 19458 } 19459 #else 19460 __ai __attribute__((target("neon"))) uint16x4_t vmul_u16(uint16x4_t __p0, uint16x4_t __p1) { 19461 uint16x4_t __ret; 19462 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19463 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 19464 __ret = __rev0 * __rev1; 19465 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19466 return __ret; 19467 } 19468 #endif 19469 19470 #ifdef __LITTLE_ENDIAN__ 19471 __ai __attribute__((target("neon"))) int8x8_t vmul_s8(int8x8_t __p0, int8x8_t __p1) { 19472 int8x8_t __ret; 19473 __ret = __p0 * __p1; 19474 return __ret; 19475 } 19476 #else 19477 __ai __attribute__((target("neon"))) int8x8_t vmul_s8(int8x8_t __p0, int8x8_t __p1) { 19478 int8x8_t __ret; 19479 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19480 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 19481 __ret = __rev0 * __rev1; 19482 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19483 return __ret; 19484 } 19485 #endif 19486 19487 #ifdef __LITTLE_ENDIAN__ 19488 __ai __attribute__((target("neon"))) float32x2_t vmul_f32(float32x2_t __p0, float32x2_t __p1) { 19489 float32x2_t __ret; 19490 __ret = __p0 * __p1; 19491 return __ret; 19492 } 19493 #else 19494 __ai __attribute__((target("neon"))) float32x2_t vmul_f32(float32x2_t __p0, float32x2_t __p1) { 19495 float32x2_t __ret; 19496 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19497 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 19498 __ret = __rev0 * __rev1; 19499 __ret = __builtin_shufflevector(__ret, 
__ret, 1, 0); 19500 return __ret; 19501 } 19502 #endif 19503 19504 #ifdef __LITTLE_ENDIAN__ 19505 __ai __attribute__((target("neon"))) int32x2_t vmul_s32(int32x2_t __p0, int32x2_t __p1) { 19506 int32x2_t __ret; 19507 __ret = __p0 * __p1; 19508 return __ret; 19509 } 19510 #else 19511 __ai __attribute__((target("neon"))) int32x2_t vmul_s32(int32x2_t __p0, int32x2_t __p1) { 19512 int32x2_t __ret; 19513 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19514 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 19515 __ret = __rev0 * __rev1; 19516 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19517 return __ret; 19518 } 19519 #endif 19520 19521 #ifdef __LITTLE_ENDIAN__ 19522 __ai __attribute__((target("neon"))) int16x4_t vmul_s16(int16x4_t __p0, int16x4_t __p1) { 19523 int16x4_t __ret; 19524 __ret = __p0 * __p1; 19525 return __ret; 19526 } 19527 #else 19528 __ai __attribute__((target("neon"))) int16x4_t vmul_s16(int16x4_t __p0, int16x4_t __p1) { 19529 int16x4_t __ret; 19530 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19531 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 19532 __ret = __rev0 * __rev1; 19533 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19534 return __ret; 19535 } 19536 #endif 19537 19538 #ifdef __LITTLE_ENDIAN__ 19539 __ai __attribute__((target("neon"))) poly8x8_t vmul_p8(poly8x8_t __p0, poly8x8_t __p1) { 19540 poly8x8_t __ret; 19541 __ret = (poly8x8_t) __builtin_neon_vmul_v((int8x8_t)__p0, (int8x8_t)__p1, 4); 19542 return __ret; 19543 } 19544 #else 19545 __ai __attribute__((target("neon"))) poly8x8_t vmul_p8(poly8x8_t __p0, poly8x8_t __p1) { 19546 poly8x8_t __ret; 19547 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19548 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 19549 __ret = (poly8x8_t) __builtin_neon_vmul_v((int8x8_t)__rev0, (int8x8_t)__rev1, 4); 
19550 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19551 return __ret; 19552 } 19553 #endif 19554 19555 #ifdef __LITTLE_ENDIAN__ 19556 __ai __attribute__((target("neon"))) poly8x16_t vmulq_p8(poly8x16_t __p0, poly8x16_t __p1) { 19557 poly8x16_t __ret; 19558 __ret = (poly8x16_t) __builtin_neon_vmulq_v((int8x16_t)__p0, (int8x16_t)__p1, 36); 19559 return __ret; 19560 } 19561 #else 19562 __ai __attribute__((target("neon"))) poly8x16_t vmulq_p8(poly8x16_t __p0, poly8x16_t __p1) { 19563 poly8x16_t __ret; 19564 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19565 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19566 __ret = (poly8x16_t) __builtin_neon_vmulq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 36); 19567 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 19568 return __ret; 19569 } 19570 #endif 19571 19572 #ifdef __LITTLE_ENDIAN__ 19573 #define vmulq_lane_u32(__p0_94, __p1_94, __p2_94) __extension__ ({ \ 19574 uint32x4_t __ret_94; \ 19575 uint32x4_t __s0_94 = __p0_94; \ 19576 uint32x2_t __s1_94 = __p1_94; \ 19577 __ret_94 = __s0_94 * splatq_lane_u32(__s1_94, __p2_94); \ 19578 __ret_94; \ 19579 }) 19580 #else 19581 #define vmulq_lane_u32(__p0_95, __p1_95, __p2_95) __extension__ ({ \ 19582 uint32x4_t __ret_95; \ 19583 uint32x4_t __s0_95 = __p0_95; \ 19584 uint32x2_t __s1_95 = __p1_95; \ 19585 uint32x4_t __rev0_95; __rev0_95 = __builtin_shufflevector(__s0_95, __s0_95, 3, 2, 1, 0); \ 19586 uint32x2_t __rev1_95; __rev1_95 = __builtin_shufflevector(__s1_95, __s1_95, 1, 0); \ 19587 __ret_95 = __rev0_95 * __noswap_splatq_lane_u32(__rev1_95, __p2_95); \ 19588 __ret_95 = __builtin_shufflevector(__ret_95, __ret_95, 3, 2, 1, 0); \ 19589 __ret_95; \ 19590 }) 19591 #endif 19592 19593 #ifdef __LITTLE_ENDIAN__ 19594 #define vmulq_lane_u16(__p0_96, __p1_96, __p2_96) 
__extension__ ({ \ 19595 uint16x8_t __ret_96; \ 19596 uint16x8_t __s0_96 = __p0_96; \ 19597 uint16x4_t __s1_96 = __p1_96; \ 19598 __ret_96 = __s0_96 * splatq_lane_u16(__s1_96, __p2_96); \ 19599 __ret_96; \ 19600 }) 19601 #else 19602 #define vmulq_lane_u16(__p0_97, __p1_97, __p2_97) __extension__ ({ \ 19603 uint16x8_t __ret_97; \ 19604 uint16x8_t __s0_97 = __p0_97; \ 19605 uint16x4_t __s1_97 = __p1_97; \ 19606 uint16x8_t __rev0_97; __rev0_97 = __builtin_shufflevector(__s0_97, __s0_97, 7, 6, 5, 4, 3, 2, 1, 0); \ 19607 uint16x4_t __rev1_97; __rev1_97 = __builtin_shufflevector(__s1_97, __s1_97, 3, 2, 1, 0); \ 19608 __ret_97 = __rev0_97 * __noswap_splatq_lane_u16(__rev1_97, __p2_97); \ 19609 __ret_97 = __builtin_shufflevector(__ret_97, __ret_97, 7, 6, 5, 4, 3, 2, 1, 0); \ 19610 __ret_97; \ 19611 }) 19612 #endif 19613 19614 #ifdef __LITTLE_ENDIAN__ 19615 #define vmulq_lane_f32(__p0_98, __p1_98, __p2_98) __extension__ ({ \ 19616 float32x4_t __ret_98; \ 19617 float32x4_t __s0_98 = __p0_98; \ 19618 float32x2_t __s1_98 = __p1_98; \ 19619 __ret_98 = __s0_98 * splatq_lane_f32(__s1_98, __p2_98); \ 19620 __ret_98; \ 19621 }) 19622 #else 19623 #define vmulq_lane_f32(__p0_99, __p1_99, __p2_99) __extension__ ({ \ 19624 float32x4_t __ret_99; \ 19625 float32x4_t __s0_99 = __p0_99; \ 19626 float32x2_t __s1_99 = __p1_99; \ 19627 float32x4_t __rev0_99; __rev0_99 = __builtin_shufflevector(__s0_99, __s0_99, 3, 2, 1, 0); \ 19628 float32x2_t __rev1_99; __rev1_99 = __builtin_shufflevector(__s1_99, __s1_99, 1, 0); \ 19629 __ret_99 = __rev0_99 * __noswap_splatq_lane_f32(__rev1_99, __p2_99); \ 19630 __ret_99 = __builtin_shufflevector(__ret_99, __ret_99, 3, 2, 1, 0); \ 19631 __ret_99; \ 19632 }) 19633 #endif 19634 19635 #ifdef __LITTLE_ENDIAN__ 19636 #define vmulq_lane_s32(__p0_100, __p1_100, __p2_100) __extension__ ({ \ 19637 int32x4_t __ret_100; \ 19638 int32x4_t __s0_100 = __p0_100; \ 19639 int32x2_t __s1_100 = __p1_100; \ 19640 __ret_100 = __s0_100 * splatq_lane_s32(__s1_100, __p2_100); \ 
19641 __ret_100; \ 19642 }) 19643 #else 19644 #define vmulq_lane_s32(__p0_101, __p1_101, __p2_101) __extension__ ({ \ 19645 int32x4_t __ret_101; \ 19646 int32x4_t __s0_101 = __p0_101; \ 19647 int32x2_t __s1_101 = __p1_101; \ 19648 int32x4_t __rev0_101; __rev0_101 = __builtin_shufflevector(__s0_101, __s0_101, 3, 2, 1, 0); \ 19649 int32x2_t __rev1_101; __rev1_101 = __builtin_shufflevector(__s1_101, __s1_101, 1, 0); \ 19650 __ret_101 = __rev0_101 * __noswap_splatq_lane_s32(__rev1_101, __p2_101); \ 19651 __ret_101 = __builtin_shufflevector(__ret_101, __ret_101, 3, 2, 1, 0); \ 19652 __ret_101; \ 19653 }) 19654 #endif 19655 19656 #ifdef __LITTLE_ENDIAN__ 19657 #define vmulq_lane_s16(__p0_102, __p1_102, __p2_102) __extension__ ({ \ 19658 int16x8_t __ret_102; \ 19659 int16x8_t __s0_102 = __p0_102; \ 19660 int16x4_t __s1_102 = __p1_102; \ 19661 __ret_102 = __s0_102 * splatq_lane_s16(__s1_102, __p2_102); \ 19662 __ret_102; \ 19663 }) 19664 #else 19665 #define vmulq_lane_s16(__p0_103, __p1_103, __p2_103) __extension__ ({ \ 19666 int16x8_t __ret_103; \ 19667 int16x8_t __s0_103 = __p0_103; \ 19668 int16x4_t __s1_103 = __p1_103; \ 19669 int16x8_t __rev0_103; __rev0_103 = __builtin_shufflevector(__s0_103, __s0_103, 7, 6, 5, 4, 3, 2, 1, 0); \ 19670 int16x4_t __rev1_103; __rev1_103 = __builtin_shufflevector(__s1_103, __s1_103, 3, 2, 1, 0); \ 19671 __ret_103 = __rev0_103 * __noswap_splatq_lane_s16(__rev1_103, __p2_103); \ 19672 __ret_103 = __builtin_shufflevector(__ret_103, __ret_103, 7, 6, 5, 4, 3, 2, 1, 0); \ 19673 __ret_103; \ 19674 }) 19675 #endif 19676 19677 #ifdef __LITTLE_ENDIAN__ 19678 #define vmul_lane_u32(__p0_104, __p1_104, __p2_104) __extension__ ({ \ 19679 uint32x2_t __ret_104; \ 19680 uint32x2_t __s0_104 = __p0_104; \ 19681 uint32x2_t __s1_104 = __p1_104; \ 19682 __ret_104 = __s0_104 * splat_lane_u32(__s1_104, __p2_104); \ 19683 __ret_104; \ 19684 }) 19685 #else 19686 #define vmul_lane_u32(__p0_105, __p1_105, __p2_105) __extension__ ({ \ 19687 uint32x2_t __ret_105; \ 
19688 uint32x2_t __s0_105 = __p0_105; \ 19689 uint32x2_t __s1_105 = __p1_105; \ 19690 uint32x2_t __rev0_105; __rev0_105 = __builtin_shufflevector(__s0_105, __s0_105, 1, 0); \ 19691 uint32x2_t __rev1_105; __rev1_105 = __builtin_shufflevector(__s1_105, __s1_105, 1, 0); \ 19692 __ret_105 = __rev0_105 * __noswap_splat_lane_u32(__rev1_105, __p2_105); \ 19693 __ret_105 = __builtin_shufflevector(__ret_105, __ret_105, 1, 0); \ 19694 __ret_105; \ 19695 }) 19696 #endif 19697 19698 #ifdef __LITTLE_ENDIAN__ 19699 #define vmul_lane_u16(__p0_106, __p1_106, __p2_106) __extension__ ({ \ 19700 uint16x4_t __ret_106; \ 19701 uint16x4_t __s0_106 = __p0_106; \ 19702 uint16x4_t __s1_106 = __p1_106; \ 19703 __ret_106 = __s0_106 * splat_lane_u16(__s1_106, __p2_106); \ 19704 __ret_106; \ 19705 }) 19706 #else 19707 #define vmul_lane_u16(__p0_107, __p1_107, __p2_107) __extension__ ({ \ 19708 uint16x4_t __ret_107; \ 19709 uint16x4_t __s0_107 = __p0_107; \ 19710 uint16x4_t __s1_107 = __p1_107; \ 19711 uint16x4_t __rev0_107; __rev0_107 = __builtin_shufflevector(__s0_107, __s0_107, 3, 2, 1, 0); \ 19712 uint16x4_t __rev1_107; __rev1_107 = __builtin_shufflevector(__s1_107, __s1_107, 3, 2, 1, 0); \ 19713 __ret_107 = __rev0_107 * __noswap_splat_lane_u16(__rev1_107, __p2_107); \ 19714 __ret_107 = __builtin_shufflevector(__ret_107, __ret_107, 3, 2, 1, 0); \ 19715 __ret_107; \ 19716 }) 19717 #endif 19718 19719 #ifdef __LITTLE_ENDIAN__ 19720 #define vmul_lane_f32(__p0_108, __p1_108, __p2_108) __extension__ ({ \ 19721 float32x2_t __ret_108; \ 19722 float32x2_t __s0_108 = __p0_108; \ 19723 float32x2_t __s1_108 = __p1_108; \ 19724 __ret_108 = __s0_108 * splat_lane_f32(__s1_108, __p2_108); \ 19725 __ret_108; \ 19726 }) 19727 #else 19728 #define vmul_lane_f32(__p0_109, __p1_109, __p2_109) __extension__ ({ \ 19729 float32x2_t __ret_109; \ 19730 float32x2_t __s0_109 = __p0_109; \ 19731 float32x2_t __s1_109 = __p1_109; \ 19732 float32x2_t __rev0_109; __rev0_109 = __builtin_shufflevector(__s0_109, __s0_109, 1, 
0); \ 19733 float32x2_t __rev1_109; __rev1_109 = __builtin_shufflevector(__s1_109, __s1_109, 1, 0); \ 19734 __ret_109 = __rev0_109 * __noswap_splat_lane_f32(__rev1_109, __p2_109); \ 19735 __ret_109 = __builtin_shufflevector(__ret_109, __ret_109, 1, 0); \ 19736 __ret_109; \ 19737 }) 19738 #endif 19739 19740 #ifdef __LITTLE_ENDIAN__ 19741 #define vmul_lane_s32(__p0_110, __p1_110, __p2_110) __extension__ ({ \ 19742 int32x2_t __ret_110; \ 19743 int32x2_t __s0_110 = __p0_110; \ 19744 int32x2_t __s1_110 = __p1_110; \ 19745 __ret_110 = __s0_110 * splat_lane_s32(__s1_110, __p2_110); \ 19746 __ret_110; \ 19747 }) 19748 #else 19749 #define vmul_lane_s32(__p0_111, __p1_111, __p2_111) __extension__ ({ \ 19750 int32x2_t __ret_111; \ 19751 int32x2_t __s0_111 = __p0_111; \ 19752 int32x2_t __s1_111 = __p1_111; \ 19753 int32x2_t __rev0_111; __rev0_111 = __builtin_shufflevector(__s0_111, __s0_111, 1, 0); \ 19754 int32x2_t __rev1_111; __rev1_111 = __builtin_shufflevector(__s1_111, __s1_111, 1, 0); \ 19755 __ret_111 = __rev0_111 * __noswap_splat_lane_s32(__rev1_111, __p2_111); \ 19756 __ret_111 = __builtin_shufflevector(__ret_111, __ret_111, 1, 0); \ 19757 __ret_111; \ 19758 }) 19759 #endif 19760 19761 #ifdef __LITTLE_ENDIAN__ 19762 #define vmul_lane_s16(__p0_112, __p1_112, __p2_112) __extension__ ({ \ 19763 int16x4_t __ret_112; \ 19764 int16x4_t __s0_112 = __p0_112; \ 19765 int16x4_t __s1_112 = __p1_112; \ 19766 __ret_112 = __s0_112 * splat_lane_s16(__s1_112, __p2_112); \ 19767 __ret_112; \ 19768 }) 19769 #else 19770 #define vmul_lane_s16(__p0_113, __p1_113, __p2_113) __extension__ ({ \ 19771 int16x4_t __ret_113; \ 19772 int16x4_t __s0_113 = __p0_113; \ 19773 int16x4_t __s1_113 = __p1_113; \ 19774 int16x4_t __rev0_113; __rev0_113 = __builtin_shufflevector(__s0_113, __s0_113, 3, 2, 1, 0); \ 19775 int16x4_t __rev1_113; __rev1_113 = __builtin_shufflevector(__s1_113, __s1_113, 3, 2, 1, 0); \ 19776 __ret_113 = __rev0_113 * __noswap_splat_lane_s16(__rev1_113, __p2_113); \ 19777 __ret_113 = 
__builtin_shufflevector(__ret_113, __ret_113, 3, 2, 1, 0); \ 19778 __ret_113; \ 19779 }) 19780 #endif 19781 19782 #ifdef __LITTLE_ENDIAN__ 19783 __ai __attribute__((target("neon"))) uint32x4_t vmulq_n_u32(uint32x4_t __p0, uint32_t __p1) { 19784 uint32x4_t __ret; 19785 __ret = __p0 * (uint32x4_t) {__p1, __p1, __p1, __p1}; 19786 return __ret; 19787 } 19788 #else 19789 __ai __attribute__((target("neon"))) uint32x4_t vmulq_n_u32(uint32x4_t __p0, uint32_t __p1) { 19790 uint32x4_t __ret; 19791 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19792 __ret = __rev0 * (uint32x4_t) {__p1, __p1, __p1, __p1}; 19793 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19794 return __ret; 19795 } 19796 #endif 19797 19798 #ifdef __LITTLE_ENDIAN__ 19799 __ai __attribute__((target("neon"))) uint16x8_t vmulq_n_u16(uint16x8_t __p0, uint16_t __p1) { 19800 uint16x8_t __ret; 19801 __ret = __p0 * (uint16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1}; 19802 return __ret; 19803 } 19804 #else 19805 __ai __attribute__((target("neon"))) uint16x8_t vmulq_n_u16(uint16x8_t __p0, uint16_t __p1) { 19806 uint16x8_t __ret; 19807 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19808 __ret = __rev0 * (uint16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1}; 19809 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19810 return __ret; 19811 } 19812 #endif 19813 19814 #ifdef __LITTLE_ENDIAN__ 19815 __ai __attribute__((target("neon"))) float32x4_t vmulq_n_f32(float32x4_t __p0, float32_t __p1) { 19816 float32x4_t __ret; 19817 __ret = __p0 * (float32x4_t) {__p1, __p1, __p1, __p1}; 19818 return __ret; 19819 } 19820 #else 19821 __ai __attribute__((target("neon"))) float32x4_t vmulq_n_f32(float32x4_t __p0, float32_t __p1) { 19822 float32x4_t __ret; 19823 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19824 __ret = __rev0 * (float32x4_t) {__p1, __p1, __p1, __p1}; 19825 __ret 
= __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19826 return __ret; 19827 } 19828 #endif 19829 19830 #ifdef __LITTLE_ENDIAN__ 19831 __ai __attribute__((target("neon"))) int32x4_t vmulq_n_s32(int32x4_t __p0, int32_t __p1) { 19832 int32x4_t __ret; 19833 __ret = __p0 * (int32x4_t) {__p1, __p1, __p1, __p1}; 19834 return __ret; 19835 } 19836 #else 19837 __ai __attribute__((target("neon"))) int32x4_t vmulq_n_s32(int32x4_t __p0, int32_t __p1) { 19838 int32x4_t __ret; 19839 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19840 __ret = __rev0 * (int32x4_t) {__p1, __p1, __p1, __p1}; 19841 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19842 return __ret; 19843 } 19844 #endif 19845 19846 #ifdef __LITTLE_ENDIAN__ 19847 __ai __attribute__((target("neon"))) int16x8_t vmulq_n_s16(int16x8_t __p0, int16_t __p1) { 19848 int16x8_t __ret; 19849 __ret = __p0 * (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1}; 19850 return __ret; 19851 } 19852 #else 19853 __ai __attribute__((target("neon"))) int16x8_t vmulq_n_s16(int16x8_t __p0, int16_t __p1) { 19854 int16x8_t __ret; 19855 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19856 __ret = __rev0 * (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1}; 19857 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19858 return __ret; 19859 } 19860 #endif 19861 19862 #ifdef __LITTLE_ENDIAN__ 19863 __ai __attribute__((target("neon"))) uint32x2_t vmul_n_u32(uint32x2_t __p0, uint32_t __p1) { 19864 uint32x2_t __ret; 19865 __ret = __p0 * (uint32x2_t) {__p1, __p1}; 19866 return __ret; 19867 } 19868 #else 19869 __ai __attribute__((target("neon"))) uint32x2_t vmul_n_u32(uint32x2_t __p0, uint32_t __p1) { 19870 uint32x2_t __ret; 19871 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19872 __ret = __rev0 * (uint32x2_t) {__p1, __p1}; 19873 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19874 return __ret; 19875 
} 19876 #endif 19877 19878 #ifdef __LITTLE_ENDIAN__ 19879 __ai __attribute__((target("neon"))) uint16x4_t vmul_n_u16(uint16x4_t __p0, uint16_t __p1) { 19880 uint16x4_t __ret; 19881 __ret = __p0 * (uint16x4_t) {__p1, __p1, __p1, __p1}; 19882 return __ret; 19883 } 19884 #else 19885 __ai __attribute__((target("neon"))) uint16x4_t vmul_n_u16(uint16x4_t __p0, uint16_t __p1) { 19886 uint16x4_t __ret; 19887 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19888 __ret = __rev0 * (uint16x4_t) {__p1, __p1, __p1, __p1}; 19889 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19890 return __ret; 19891 } 19892 #endif 19893 19894 #ifdef __LITTLE_ENDIAN__ 19895 __ai __attribute__((target("neon"))) float32x2_t vmul_n_f32(float32x2_t __p0, float32_t __p1) { 19896 float32x2_t __ret; 19897 __ret = __p0 * (float32x2_t) {__p1, __p1}; 19898 return __ret; 19899 } 19900 #else 19901 __ai __attribute__((target("neon"))) float32x2_t vmul_n_f32(float32x2_t __p0, float32_t __p1) { 19902 float32x2_t __ret; 19903 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19904 __ret = __rev0 * (float32x2_t) {__p1, __p1}; 19905 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19906 return __ret; 19907 } 19908 #endif 19909 19910 #ifdef __LITTLE_ENDIAN__ 19911 __ai __attribute__((target("neon"))) int32x2_t vmul_n_s32(int32x2_t __p0, int32_t __p1) { 19912 int32x2_t __ret; 19913 __ret = __p0 * (int32x2_t) {__p1, __p1}; 19914 return __ret; 19915 } 19916 #else 19917 __ai __attribute__((target("neon"))) int32x2_t vmul_n_s32(int32x2_t __p0, int32_t __p1) { 19918 int32x2_t __ret; 19919 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19920 __ret = __rev0 * (int32x2_t) {__p1, __p1}; 19921 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19922 return __ret; 19923 } 19924 #endif 19925 19926 #ifdef __LITTLE_ENDIAN__ 19927 __ai __attribute__((target("neon"))) int16x4_t vmul_n_s16(int16x4_t __p0, int16_t __p1) { 19928 int16x4_t 
__ret; 19929 __ret = __p0 * (int16x4_t) {__p1, __p1, __p1, __p1}; 19930 return __ret; 19931 } 19932 #else 19933 __ai __attribute__((target("neon"))) int16x4_t vmul_n_s16(int16x4_t __p0, int16_t __p1) { 19934 int16x4_t __ret; 19935 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 19936 __ret = __rev0 * (int16x4_t) {__p1, __p1, __p1, __p1}; 19937 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 19938 return __ret; 19939 } 19940 #endif 19941 19942 #ifdef __LITTLE_ENDIAN__ 19943 __ai __attribute__((target("neon"))) poly16x8_t vmull_p8(poly8x8_t __p0, poly8x8_t __p1) { 19944 poly16x8_t __ret; 19945 __ret = (poly16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 37); 19946 return __ret; 19947 } 19948 #else 19949 __ai __attribute__((target("neon"))) poly16x8_t vmull_p8(poly8x8_t __p0, poly8x8_t __p1) { 19950 poly16x8_t __ret; 19951 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 19952 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 19953 __ret = (poly16x8_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 37); 19954 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19955 return __ret; 19956 } 19957 __ai __attribute__((target("neon"))) poly16x8_t __noswap_vmull_p8(poly8x8_t __p0, poly8x8_t __p1) { 19958 poly16x8_t __ret; 19959 __ret = (poly16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 37); 19960 return __ret; 19961 } 19962 #endif 19963 19964 #ifdef __LITTLE_ENDIAN__ 19965 __ai __attribute__((target("neon"))) uint16x8_t vmull_u8(uint8x8_t __p0, uint8x8_t __p1) { 19966 uint16x8_t __ret; 19967 __ret = (uint16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 49); 19968 return __ret; 19969 } 19970 #else 19971 __ai __attribute__((target("neon"))) uint16x8_t vmull_u8(uint8x8_t __p0, uint8x8_t __p1) { 19972 uint16x8_t __ret; 19973 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 
6, 5, 4, 3, 2, 1, 0); 19974 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 19975 __ret = (uint16x8_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 49); 19976 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 19977 return __ret; 19978 } 19979 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmull_u8(uint8x8_t __p0, uint8x8_t __p1) { 19980 uint16x8_t __ret; 19981 __ret = (uint16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 49); 19982 return __ret; 19983 } 19984 #endif 19985 19986 #ifdef __LITTLE_ENDIAN__ 19987 __ai __attribute__((target("neon"))) uint64x2_t vmull_u32(uint32x2_t __p0, uint32x2_t __p1) { 19988 uint64x2_t __ret; 19989 __ret = (uint64x2_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 51); 19990 return __ret; 19991 } 19992 #else 19993 __ai __attribute__((target("neon"))) uint64x2_t vmull_u32(uint32x2_t __p0, uint32x2_t __p1) { 19994 uint64x2_t __ret; 19995 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 19996 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 19997 __ret = (uint64x2_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 51); 19998 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 19999 return __ret; 20000 } 20001 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmull_u32(uint32x2_t __p0, uint32x2_t __p1) { 20002 uint64x2_t __ret; 20003 __ret = (uint64x2_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 51); 20004 return __ret; 20005 } 20006 #endif 20007 20008 #ifdef __LITTLE_ENDIAN__ 20009 __ai __attribute__((target("neon"))) uint32x4_t vmull_u16(uint16x4_t __p0, uint16x4_t __p1) { 20010 uint32x4_t __ret; 20011 __ret = (uint32x4_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 50); 20012 return __ret; 20013 } 20014 #else 20015 __ai __attribute__((target("neon"))) uint32x4_t vmull_u16(uint16x4_t __p0, uint16x4_t __p1) { 20016 uint32x4_t __ret; 20017 
uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20018 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 20019 __ret = (uint32x4_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 50); 20020 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20021 return __ret; 20022 } 20023 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmull_u16(uint16x4_t __p0, uint16x4_t __p1) { 20024 uint32x4_t __ret; 20025 __ret = (uint32x4_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 50); 20026 return __ret; 20027 } 20028 #endif 20029 20030 #ifdef __LITTLE_ENDIAN__ 20031 __ai __attribute__((target("neon"))) int16x8_t vmull_s8(int8x8_t __p0, int8x8_t __p1) { 20032 int16x8_t __ret; 20033 __ret = (int16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 33); 20034 return __ret; 20035 } 20036 #else 20037 __ai __attribute__((target("neon"))) int16x8_t vmull_s8(int8x8_t __p0, int8x8_t __p1) { 20038 int16x8_t __ret; 20039 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20040 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 20041 __ret = (int16x8_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 33); 20042 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20043 return __ret; 20044 } 20045 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmull_s8(int8x8_t __p0, int8x8_t __p1) { 20046 int16x8_t __ret; 20047 __ret = (int16x8_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 33); 20048 return __ret; 20049 } 20050 #endif 20051 20052 #ifdef __LITTLE_ENDIAN__ 20053 __ai __attribute__((target("neon"))) int64x2_t vmull_s32(int32x2_t __p0, int32x2_t __p1) { 20054 int64x2_t __ret; 20055 __ret = (int64x2_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 35); 20056 return __ret; 20057 } 20058 #else 20059 __ai __attribute__((target("neon"))) int64x2_t vmull_s32(int32x2_t __p0, 
int32x2_t __p1) { 20060 int64x2_t __ret; 20061 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20062 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 20063 __ret = (int64x2_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 35); 20064 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20065 return __ret; 20066 } 20067 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmull_s32(int32x2_t __p0, int32x2_t __p1) { 20068 int64x2_t __ret; 20069 __ret = (int64x2_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 35); 20070 return __ret; 20071 } 20072 #endif 20073 20074 #ifdef __LITTLE_ENDIAN__ 20075 __ai __attribute__((target("neon"))) int32x4_t vmull_s16(int16x4_t __p0, int16x4_t __p1) { 20076 int32x4_t __ret; 20077 __ret = (int32x4_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 34); 20078 return __ret; 20079 } 20080 #else 20081 __ai __attribute__((target("neon"))) int32x4_t vmull_s16(int16x4_t __p0, int16x4_t __p1) { 20082 int32x4_t __ret; 20083 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20084 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 20085 __ret = (int32x4_t) __builtin_neon_vmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 34); 20086 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20087 return __ret; 20088 } 20089 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmull_s16(int16x4_t __p0, int16x4_t __p1) { 20090 int32x4_t __ret; 20091 __ret = (int32x4_t) __builtin_neon_vmull_v((int8x8_t)__p0, (int8x8_t)__p1, 34); 20092 return __ret; 20093 } 20094 #endif 20095 20096 #ifdef __LITTLE_ENDIAN__ 20097 #define vmull_lane_u32(__p0_114, __p1_114, __p2_114) __extension__ ({ \ 20098 uint64x2_t __ret_114; \ 20099 uint32x2_t __s0_114 = __p0_114; \ 20100 uint32x2_t __s1_114 = __p1_114; \ 20101 __ret_114 = vmull_u32(__s0_114, splat_lane_u32(__s1_114, __p2_114)); \ 20102 __ret_114; \ 20103 }) 20104 #else 20105 #define 
vmull_lane_u32(__p0_115, __p1_115, __p2_115) __extension__ ({ \ 20106 uint64x2_t __ret_115; \ 20107 uint32x2_t __s0_115 = __p0_115; \ 20108 uint32x2_t __s1_115 = __p1_115; \ 20109 uint32x2_t __rev0_115; __rev0_115 = __builtin_shufflevector(__s0_115, __s0_115, 1, 0); \ 20110 uint32x2_t __rev1_115; __rev1_115 = __builtin_shufflevector(__s1_115, __s1_115, 1, 0); \ 20111 __ret_115 = __noswap_vmull_u32(__rev0_115, __noswap_splat_lane_u32(__rev1_115, __p2_115)); \ 20112 __ret_115 = __builtin_shufflevector(__ret_115, __ret_115, 1, 0); \ 20113 __ret_115; \ 20114 }) 20115 #endif 20116 20117 #ifdef __LITTLE_ENDIAN__ 20118 #define vmull_lane_u16(__p0_116, __p1_116, __p2_116) __extension__ ({ \ 20119 uint32x4_t __ret_116; \ 20120 uint16x4_t __s0_116 = __p0_116; \ 20121 uint16x4_t __s1_116 = __p1_116; \ 20122 __ret_116 = vmull_u16(__s0_116, splat_lane_u16(__s1_116, __p2_116)); \ 20123 __ret_116; \ 20124 }) 20125 #else 20126 #define vmull_lane_u16(__p0_117, __p1_117, __p2_117) __extension__ ({ \ 20127 uint32x4_t __ret_117; \ 20128 uint16x4_t __s0_117 = __p0_117; \ 20129 uint16x4_t __s1_117 = __p1_117; \ 20130 uint16x4_t __rev0_117; __rev0_117 = __builtin_shufflevector(__s0_117, __s0_117, 3, 2, 1, 0); \ 20131 uint16x4_t __rev1_117; __rev1_117 = __builtin_shufflevector(__s1_117, __s1_117, 3, 2, 1, 0); \ 20132 __ret_117 = __noswap_vmull_u16(__rev0_117, __noswap_splat_lane_u16(__rev1_117, __p2_117)); \ 20133 __ret_117 = __builtin_shufflevector(__ret_117, __ret_117, 3, 2, 1, 0); \ 20134 __ret_117; \ 20135 }) 20136 #endif 20137 20138 #ifdef __LITTLE_ENDIAN__ 20139 #define vmull_lane_s32(__p0_118, __p1_118, __p2_118) __extension__ ({ \ 20140 int64x2_t __ret_118; \ 20141 int32x2_t __s0_118 = __p0_118; \ 20142 int32x2_t __s1_118 = __p1_118; \ 20143 __ret_118 = vmull_s32(__s0_118, splat_lane_s32(__s1_118, __p2_118)); \ 20144 __ret_118; \ 20145 }) 20146 #else 20147 #define vmull_lane_s32(__p0_119, __p1_119, __p2_119) __extension__ ({ \ 20148 int64x2_t __ret_119; \ 20149 int32x2_t __s0_119 
= __p0_119; \ 20150 int32x2_t __s1_119 = __p1_119; \ 20151 int32x2_t __rev0_119; __rev0_119 = __builtin_shufflevector(__s0_119, __s0_119, 1, 0); \ 20152 int32x2_t __rev1_119; __rev1_119 = __builtin_shufflevector(__s1_119, __s1_119, 1, 0); \ 20153 __ret_119 = __noswap_vmull_s32(__rev0_119, __noswap_splat_lane_s32(__rev1_119, __p2_119)); \ 20154 __ret_119 = __builtin_shufflevector(__ret_119, __ret_119, 1, 0); \ 20155 __ret_119; \ 20156 }) 20157 #endif 20158 20159 #ifdef __LITTLE_ENDIAN__ 20160 #define vmull_lane_s16(__p0_120, __p1_120, __p2_120) __extension__ ({ \ 20161 int32x4_t __ret_120; \ 20162 int16x4_t __s0_120 = __p0_120; \ 20163 int16x4_t __s1_120 = __p1_120; \ 20164 __ret_120 = vmull_s16(__s0_120, splat_lane_s16(__s1_120, __p2_120)); \ 20165 __ret_120; \ 20166 }) 20167 #else 20168 #define vmull_lane_s16(__p0_121, __p1_121, __p2_121) __extension__ ({ \ 20169 int32x4_t __ret_121; \ 20170 int16x4_t __s0_121 = __p0_121; \ 20171 int16x4_t __s1_121 = __p1_121; \ 20172 int16x4_t __rev0_121; __rev0_121 = __builtin_shufflevector(__s0_121, __s0_121, 3, 2, 1, 0); \ 20173 int16x4_t __rev1_121; __rev1_121 = __builtin_shufflevector(__s1_121, __s1_121, 3, 2, 1, 0); \ 20174 __ret_121 = __noswap_vmull_s16(__rev0_121, __noswap_splat_lane_s16(__rev1_121, __p2_121)); \ 20175 __ret_121 = __builtin_shufflevector(__ret_121, __ret_121, 3, 2, 1, 0); \ 20176 __ret_121; \ 20177 }) 20178 #endif 20179 20180 #ifdef __LITTLE_ENDIAN__ 20181 __ai __attribute__((target("neon"))) uint64x2_t vmull_n_u32(uint32x2_t __p0, uint32_t __p1) { 20182 uint64x2_t __ret; 20183 __ret = vmull_u32(__p0, (uint32x2_t) {__p1, __p1}); 20184 return __ret; 20185 } 20186 #else 20187 __ai __attribute__((target("neon"))) uint64x2_t vmull_n_u32(uint32x2_t __p0, uint32_t __p1) { 20188 uint64x2_t __ret; 20189 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20190 __ret = __noswap_vmull_u32(__rev0, (uint32x2_t) {__p1, __p1}); 20191 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20192 return 
__ret; 20193 } 20194 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmull_n_u32(uint32x2_t __p0, uint32_t __p1) { 20195 uint64x2_t __ret; 20196 __ret = __noswap_vmull_u32(__p0, (uint32x2_t) {__p1, __p1}); 20197 return __ret; 20198 } 20199 #endif 20200 20201 #ifdef __LITTLE_ENDIAN__ 20202 __ai __attribute__((target("neon"))) uint32x4_t vmull_n_u16(uint16x4_t __p0, uint16_t __p1) { 20203 uint32x4_t __ret; 20204 __ret = vmull_u16(__p0, (uint16x4_t) {__p1, __p1, __p1, __p1}); 20205 return __ret; 20206 } 20207 #else 20208 __ai __attribute__((target("neon"))) uint32x4_t vmull_n_u16(uint16x4_t __p0, uint16_t __p1) { 20209 uint32x4_t __ret; 20210 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20211 __ret = __noswap_vmull_u16(__rev0, (uint16x4_t) {__p1, __p1, __p1, __p1}); 20212 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20213 return __ret; 20214 } 20215 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmull_n_u16(uint16x4_t __p0, uint16_t __p1) { 20216 uint32x4_t __ret; 20217 __ret = __noswap_vmull_u16(__p0, (uint16x4_t) {__p1, __p1, __p1, __p1}); 20218 return __ret; 20219 } 20220 #endif 20221 20222 #ifdef __LITTLE_ENDIAN__ 20223 __ai __attribute__((target("neon"))) int64x2_t vmull_n_s32(int32x2_t __p0, int32_t __p1) { 20224 int64x2_t __ret; 20225 __ret = vmull_s32(__p0, (int32x2_t) {__p1, __p1}); 20226 return __ret; 20227 } 20228 #else 20229 __ai __attribute__((target("neon"))) int64x2_t vmull_n_s32(int32x2_t __p0, int32_t __p1) { 20230 int64x2_t __ret; 20231 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20232 __ret = __noswap_vmull_s32(__rev0, (int32x2_t) {__p1, __p1}); 20233 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20234 return __ret; 20235 } 20236 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmull_n_s32(int32x2_t __p0, int32_t __p1) { 20237 int64x2_t __ret; 20238 __ret = __noswap_vmull_s32(__p0, (int32x2_t) {__p1, __p1}); 20239 return __ret; 20240 } 20241 
#endif 20242 20243 #ifdef __LITTLE_ENDIAN__ 20244 __ai __attribute__((target("neon"))) int32x4_t vmull_n_s16(int16x4_t __p0, int16_t __p1) { 20245 int32x4_t __ret; 20246 __ret = vmull_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1}); 20247 return __ret; 20248 } 20249 #else 20250 __ai __attribute__((target("neon"))) int32x4_t vmull_n_s16(int16x4_t __p0, int16_t __p1) { 20251 int32x4_t __ret; 20252 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20253 __ret = __noswap_vmull_s16(__rev0, (int16x4_t) {__p1, __p1, __p1, __p1}); 20254 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20255 return __ret; 20256 } 20257 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmull_n_s16(int16x4_t __p0, int16_t __p1) { 20258 int32x4_t __ret; 20259 __ret = __noswap_vmull_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1}); 20260 return __ret; 20261 } 20262 #endif 20263 20264 #ifdef __LITTLE_ENDIAN__ 20265 __ai __attribute__((target("neon"))) poly8x8_t vmvn_p8(poly8x8_t __p0) { 20266 poly8x8_t __ret; 20267 __ret = ~__p0; 20268 return __ret; 20269 } 20270 #else 20271 __ai __attribute__((target("neon"))) poly8x8_t vmvn_p8(poly8x8_t __p0) { 20272 poly8x8_t __ret; 20273 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20274 __ret = ~__rev0; 20275 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20276 return __ret; 20277 } 20278 #endif 20279 20280 #ifdef __LITTLE_ENDIAN__ 20281 __ai __attribute__((target("neon"))) poly8x16_t vmvnq_p8(poly8x16_t __p0) { 20282 poly8x16_t __ret; 20283 __ret = ~__p0; 20284 return __ret; 20285 } 20286 #else 20287 __ai __attribute__((target("neon"))) poly8x16_t vmvnq_p8(poly8x16_t __p0) { 20288 poly8x16_t __ret; 20289 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20290 __ret = ~__rev0; 20291 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 
20292 return __ret; 20293 } 20294 #endif 20295 20296 #ifdef __LITTLE_ENDIAN__ 20297 __ai __attribute__((target("neon"))) uint8x16_t vmvnq_u8(uint8x16_t __p0) { 20298 uint8x16_t __ret; 20299 __ret = ~__p0; 20300 return __ret; 20301 } 20302 #else 20303 __ai __attribute__((target("neon"))) uint8x16_t vmvnq_u8(uint8x16_t __p0) { 20304 uint8x16_t __ret; 20305 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20306 __ret = ~__rev0; 20307 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20308 return __ret; 20309 } 20310 #endif 20311 20312 #ifdef __LITTLE_ENDIAN__ 20313 __ai __attribute__((target("neon"))) uint32x4_t vmvnq_u32(uint32x4_t __p0) { 20314 uint32x4_t __ret; 20315 __ret = ~__p0; 20316 return __ret; 20317 } 20318 #else 20319 __ai __attribute__((target("neon"))) uint32x4_t vmvnq_u32(uint32x4_t __p0) { 20320 uint32x4_t __ret; 20321 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20322 __ret = ~__rev0; 20323 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20324 return __ret; 20325 } 20326 #endif 20327 20328 #ifdef __LITTLE_ENDIAN__ 20329 __ai __attribute__((target("neon"))) uint16x8_t vmvnq_u16(uint16x8_t __p0) { 20330 uint16x8_t __ret; 20331 __ret = ~__p0; 20332 return __ret; 20333 } 20334 #else 20335 __ai __attribute__((target("neon"))) uint16x8_t vmvnq_u16(uint16x8_t __p0) { 20336 uint16x8_t __ret; 20337 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20338 __ret = ~__rev0; 20339 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20340 return __ret; 20341 } 20342 #endif 20343 20344 #ifdef __LITTLE_ENDIAN__ 20345 __ai __attribute__((target("neon"))) int8x16_t vmvnq_s8(int8x16_t __p0) { 20346 int8x16_t __ret; 20347 __ret = ~__p0; 20348 return __ret; 20349 } 20350 #else 20351 __ai __attribute__((target("neon"))) int8x16_t vmvnq_s8(int8x16_t __p0) { 
20352 int8x16_t __ret; 20353 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20354 __ret = ~__rev0; 20355 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20356 return __ret; 20357 } 20358 #endif 20359 20360 #ifdef __LITTLE_ENDIAN__ 20361 __ai __attribute__((target("neon"))) int32x4_t vmvnq_s32(int32x4_t __p0) { 20362 int32x4_t __ret; 20363 __ret = ~__p0; 20364 return __ret; 20365 } 20366 #else 20367 __ai __attribute__((target("neon"))) int32x4_t vmvnq_s32(int32x4_t __p0) { 20368 int32x4_t __ret; 20369 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20370 __ret = ~__rev0; 20371 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20372 return __ret; 20373 } 20374 #endif 20375 20376 #ifdef __LITTLE_ENDIAN__ 20377 __ai __attribute__((target("neon"))) int16x8_t vmvnq_s16(int16x8_t __p0) { 20378 int16x8_t __ret; 20379 __ret = ~__p0; 20380 return __ret; 20381 } 20382 #else 20383 __ai __attribute__((target("neon"))) int16x8_t vmvnq_s16(int16x8_t __p0) { 20384 int16x8_t __ret; 20385 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20386 __ret = ~__rev0; 20387 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20388 return __ret; 20389 } 20390 #endif 20391 20392 #ifdef __LITTLE_ENDIAN__ 20393 __ai __attribute__((target("neon"))) uint8x8_t vmvn_u8(uint8x8_t __p0) { 20394 uint8x8_t __ret; 20395 __ret = ~__p0; 20396 return __ret; 20397 } 20398 #else 20399 __ai __attribute__((target("neon"))) uint8x8_t vmvn_u8(uint8x8_t __p0) { 20400 uint8x8_t __ret; 20401 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20402 __ret = ~__rev0; 20403 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20404 return __ret; 20405 } 20406 #endif 20407 20408 #ifdef __LITTLE_ENDIAN__ 20409 __ai __attribute__((target("neon"))) 
uint32x2_t vmvn_u32(uint32x2_t __p0) { 20410 uint32x2_t __ret; 20411 __ret = ~__p0; 20412 return __ret; 20413 } 20414 #else 20415 __ai __attribute__((target("neon"))) uint32x2_t vmvn_u32(uint32x2_t __p0) { 20416 uint32x2_t __ret; 20417 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20418 __ret = ~__rev0; 20419 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20420 return __ret; 20421 } 20422 #endif 20423 20424 #ifdef __LITTLE_ENDIAN__ 20425 __ai __attribute__((target("neon"))) uint16x4_t vmvn_u16(uint16x4_t __p0) { 20426 uint16x4_t __ret; 20427 __ret = ~__p0; 20428 return __ret; 20429 } 20430 #else 20431 __ai __attribute__((target("neon"))) uint16x4_t vmvn_u16(uint16x4_t __p0) { 20432 uint16x4_t __ret; 20433 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20434 __ret = ~__rev0; 20435 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20436 return __ret; 20437 } 20438 #endif 20439 20440 #ifdef __LITTLE_ENDIAN__ 20441 __ai __attribute__((target("neon"))) int8x8_t vmvn_s8(int8x8_t __p0) { 20442 int8x8_t __ret; 20443 __ret = ~__p0; 20444 return __ret; 20445 } 20446 #else 20447 __ai __attribute__((target("neon"))) int8x8_t vmvn_s8(int8x8_t __p0) { 20448 int8x8_t __ret; 20449 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20450 __ret = ~__rev0; 20451 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20452 return __ret; 20453 } 20454 #endif 20455 20456 #ifdef __LITTLE_ENDIAN__ 20457 __ai __attribute__((target("neon"))) int32x2_t vmvn_s32(int32x2_t __p0) { 20458 int32x2_t __ret; 20459 __ret = ~__p0; 20460 return __ret; 20461 } 20462 #else 20463 __ai __attribute__((target("neon"))) int32x2_t vmvn_s32(int32x2_t __p0) { 20464 int32x2_t __ret; 20465 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20466 __ret = ~__rev0; 20467 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20468 return __ret; 20469 } 20470 #endif 20471 20472 
#ifdef __LITTLE_ENDIAN__ 20473 __ai __attribute__((target("neon"))) int16x4_t vmvn_s16(int16x4_t __p0) { 20474 int16x4_t __ret; 20475 __ret = ~__p0; 20476 return __ret; 20477 } 20478 #else 20479 __ai __attribute__((target("neon"))) int16x4_t vmvn_s16(int16x4_t __p0) { 20480 int16x4_t __ret; 20481 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20482 __ret = ~__rev0; 20483 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20484 return __ret; 20485 } 20486 #endif 20487 20488 #ifdef __LITTLE_ENDIAN__ 20489 __ai __attribute__((target("neon"))) int8x16_t vnegq_s8(int8x16_t __p0) { 20490 int8x16_t __ret; 20491 __ret = -__p0; 20492 return __ret; 20493 } 20494 #else 20495 __ai __attribute__((target("neon"))) int8x16_t vnegq_s8(int8x16_t __p0) { 20496 int8x16_t __ret; 20497 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20498 __ret = -__rev0; 20499 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20500 return __ret; 20501 } 20502 #endif 20503 20504 #ifdef __LITTLE_ENDIAN__ 20505 __ai __attribute__((target("neon"))) float32x4_t vnegq_f32(float32x4_t __p0) { 20506 float32x4_t __ret; 20507 __ret = -__p0; 20508 return __ret; 20509 } 20510 #else 20511 __ai __attribute__((target("neon"))) float32x4_t vnegq_f32(float32x4_t __p0) { 20512 float32x4_t __ret; 20513 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20514 __ret = -__rev0; 20515 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20516 return __ret; 20517 } 20518 #endif 20519 20520 #ifdef __LITTLE_ENDIAN__ 20521 __ai __attribute__((target("neon"))) int32x4_t vnegq_s32(int32x4_t __p0) { 20522 int32x4_t __ret; 20523 __ret = -__p0; 20524 return __ret; 20525 } 20526 #else 20527 __ai __attribute__((target("neon"))) int32x4_t vnegq_s32(int32x4_t __p0) { 20528 int32x4_t __ret; 20529 int32x4_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20530 __ret = -__rev0; 20531 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20532 return __ret; 20533 } 20534 #endif 20535 20536 #ifdef __LITTLE_ENDIAN__ 20537 __ai __attribute__((target("neon"))) int16x8_t vnegq_s16(int16x8_t __p0) { 20538 int16x8_t __ret; 20539 __ret = -__p0; 20540 return __ret; 20541 } 20542 #else 20543 __ai __attribute__((target("neon"))) int16x8_t vnegq_s16(int16x8_t __p0) { 20544 int16x8_t __ret; 20545 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20546 __ret = -__rev0; 20547 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20548 return __ret; 20549 } 20550 #endif 20551 20552 #ifdef __LITTLE_ENDIAN__ 20553 __ai __attribute__((target("neon"))) int8x8_t vneg_s8(int8x8_t __p0) { 20554 int8x8_t __ret; 20555 __ret = -__p0; 20556 return __ret; 20557 } 20558 #else 20559 __ai __attribute__((target("neon"))) int8x8_t vneg_s8(int8x8_t __p0) { 20560 int8x8_t __ret; 20561 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20562 __ret = -__rev0; 20563 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20564 return __ret; 20565 } 20566 #endif 20567 20568 #ifdef __LITTLE_ENDIAN__ 20569 __ai __attribute__((target("neon"))) float32x2_t vneg_f32(float32x2_t __p0) { 20570 float32x2_t __ret; 20571 __ret = -__p0; 20572 return __ret; 20573 } 20574 #else 20575 __ai __attribute__((target("neon"))) float32x2_t vneg_f32(float32x2_t __p0) { 20576 float32x2_t __ret; 20577 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20578 __ret = -__rev0; 20579 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20580 return __ret; 20581 } 20582 #endif 20583 20584 #ifdef __LITTLE_ENDIAN__ 20585 __ai __attribute__((target("neon"))) int32x2_t vneg_s32(int32x2_t __p0) { 20586 int32x2_t __ret; 20587 __ret = -__p0; 20588 return __ret; 20589 } 20590 #else 20591 __ai 
__attribute__((target("neon"))) int32x2_t vneg_s32(int32x2_t __p0) { 20592 int32x2_t __ret; 20593 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20594 __ret = -__rev0; 20595 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20596 return __ret; 20597 } 20598 #endif 20599 20600 #ifdef __LITTLE_ENDIAN__ 20601 __ai __attribute__((target("neon"))) int16x4_t vneg_s16(int16x4_t __p0) { 20602 int16x4_t __ret; 20603 __ret = -__p0; 20604 return __ret; 20605 } 20606 #else 20607 __ai __attribute__((target("neon"))) int16x4_t vneg_s16(int16x4_t __p0) { 20608 int16x4_t __ret; 20609 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20610 __ret = -__rev0; 20611 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20612 return __ret; 20613 } 20614 #endif 20615 20616 #ifdef __LITTLE_ENDIAN__ 20617 __ai __attribute__((target("neon"))) uint8x16_t vornq_u8(uint8x16_t __p0, uint8x16_t __p1) { 20618 uint8x16_t __ret; 20619 __ret = __p0 | ~__p1; 20620 return __ret; 20621 } 20622 #else 20623 __ai __attribute__((target("neon"))) uint8x16_t vornq_u8(uint8x16_t __p0, uint8x16_t __p1) { 20624 uint8x16_t __ret; 20625 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20626 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20627 __ret = __rev0 | ~__rev1; 20628 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20629 return __ret; 20630 } 20631 #endif 20632 20633 #ifdef __LITTLE_ENDIAN__ 20634 __ai __attribute__((target("neon"))) uint32x4_t vornq_u32(uint32x4_t __p0, uint32x4_t __p1) { 20635 uint32x4_t __ret; 20636 __ret = __p0 | ~__p1; 20637 return __ret; 20638 } 20639 #else 20640 __ai __attribute__((target("neon"))) uint32x4_t vornq_u32(uint32x4_t __p0, uint32x4_t __p1) { 20641 uint32x4_t __ret; 20642 uint32x4_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20643 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 20644 __ret = __rev0 | ~__rev1; 20645 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20646 return __ret; 20647 } 20648 #endif 20649 20650 #ifdef __LITTLE_ENDIAN__ 20651 __ai __attribute__((target("neon"))) uint64x2_t vornq_u64(uint64x2_t __p0, uint64x2_t __p1) { 20652 uint64x2_t __ret; 20653 __ret = __p0 | ~__p1; 20654 return __ret; 20655 } 20656 #else 20657 __ai __attribute__((target("neon"))) uint64x2_t vornq_u64(uint64x2_t __p0, uint64x2_t __p1) { 20658 uint64x2_t __ret; 20659 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20660 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 20661 __ret = __rev0 | ~__rev1; 20662 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20663 return __ret; 20664 } 20665 #endif 20666 20667 #ifdef __LITTLE_ENDIAN__ 20668 __ai __attribute__((target("neon"))) uint16x8_t vornq_u16(uint16x8_t __p0, uint16x8_t __p1) { 20669 uint16x8_t __ret; 20670 __ret = __p0 | ~__p1; 20671 return __ret; 20672 } 20673 #else 20674 __ai __attribute__((target("neon"))) uint16x8_t vornq_u16(uint16x8_t __p0, uint16x8_t __p1) { 20675 uint16x8_t __ret; 20676 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20677 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 20678 __ret = __rev0 | ~__rev1; 20679 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20680 return __ret; 20681 } 20682 #endif 20683 20684 #ifdef __LITTLE_ENDIAN__ 20685 __ai __attribute__((target("neon"))) int8x16_t vornq_s8(int8x16_t __p0, int8x16_t __p1) { 20686 int8x16_t __ret; 20687 __ret = __p0 | ~__p1; 20688 return __ret; 20689 } 20690 #else 20691 __ai __attribute__((target("neon"))) int8x16_t vornq_s8(int8x16_t __p0, int8x16_t __p1) { 20692 int8x16_t __ret; 20693 int8x16_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20694 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20695 __ret = __rev0 | ~__rev1; 20696 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20697 return __ret; 20698 } 20699 #endif 20700 20701 #ifdef __LITTLE_ENDIAN__ 20702 __ai __attribute__((target("neon"))) int32x4_t vornq_s32(int32x4_t __p0, int32x4_t __p1) { 20703 int32x4_t __ret; 20704 __ret = __p0 | ~__p1; 20705 return __ret; 20706 } 20707 #else 20708 __ai __attribute__((target("neon"))) int32x4_t vornq_s32(int32x4_t __p0, int32x4_t __p1) { 20709 int32x4_t __ret; 20710 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20711 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 20712 __ret = __rev0 | ~__rev1; 20713 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20714 return __ret; 20715 } 20716 #endif 20717 20718 #ifdef __LITTLE_ENDIAN__ 20719 __ai __attribute__((target("neon"))) int64x2_t vornq_s64(int64x2_t __p0, int64x2_t __p1) { 20720 int64x2_t __ret; 20721 __ret = __p0 | ~__p1; 20722 return __ret; 20723 } 20724 #else 20725 __ai __attribute__((target("neon"))) int64x2_t vornq_s64(int64x2_t __p0, int64x2_t __p1) { 20726 int64x2_t __ret; 20727 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20728 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 20729 __ret = __rev0 | ~__rev1; 20730 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20731 return __ret; 20732 } 20733 #endif 20734 20735 #ifdef __LITTLE_ENDIAN__ 20736 __ai __attribute__((target("neon"))) int16x8_t vornq_s16(int16x8_t __p0, int16x8_t __p1) { 20737 int16x8_t __ret; 20738 __ret = __p0 | ~__p1; 20739 return __ret; 20740 } 20741 #else 20742 __ai __attribute__((target("neon"))) int16x8_t vornq_s16(int16x8_t __p0, int16x8_t __p1) { 20743 
int16x8_t __ret; 20744 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20745 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 20746 __ret = __rev0 | ~__rev1; 20747 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20748 return __ret; 20749 } 20750 #endif 20751 20752 #ifdef __LITTLE_ENDIAN__ 20753 __ai __attribute__((target("neon"))) uint8x8_t vorn_u8(uint8x8_t __p0, uint8x8_t __p1) { 20754 uint8x8_t __ret; 20755 __ret = __p0 | ~__p1; 20756 return __ret; 20757 } 20758 #else 20759 __ai __attribute__((target("neon"))) uint8x8_t vorn_u8(uint8x8_t __p0, uint8x8_t __p1) { 20760 uint8x8_t __ret; 20761 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20762 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 20763 __ret = __rev0 | ~__rev1; 20764 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20765 return __ret; 20766 } 20767 #endif 20768 20769 #ifdef __LITTLE_ENDIAN__ 20770 __ai __attribute__((target("neon"))) uint32x2_t vorn_u32(uint32x2_t __p0, uint32x2_t __p1) { 20771 uint32x2_t __ret; 20772 __ret = __p0 | ~__p1; 20773 return __ret; 20774 } 20775 #else 20776 __ai __attribute__((target("neon"))) uint32x2_t vorn_u32(uint32x2_t __p0, uint32x2_t __p1) { 20777 uint32x2_t __ret; 20778 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20779 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 20780 __ret = __rev0 | ~__rev1; 20781 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20782 return __ret; 20783 } 20784 #endif 20785 20786 __ai __attribute__((target("neon"))) uint64x1_t vorn_u64(uint64x1_t __p0, uint64x1_t __p1) { 20787 uint64x1_t __ret; 20788 __ret = __p0 | ~__p1; 20789 return __ret; 20790 } 20791 #ifdef __LITTLE_ENDIAN__ 20792 __ai __attribute__((target("neon"))) uint16x4_t vorn_u16(uint16x4_t __p0, uint16x4_t __p1) { 20793 
uint16x4_t __ret; 20794 __ret = __p0 | ~__p1; 20795 return __ret; 20796 } 20797 #else 20798 __ai __attribute__((target("neon"))) uint16x4_t vorn_u16(uint16x4_t __p0, uint16x4_t __p1) { 20799 uint16x4_t __ret; 20800 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20801 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 20802 __ret = __rev0 | ~__rev1; 20803 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20804 return __ret; 20805 } 20806 #endif 20807 20808 #ifdef __LITTLE_ENDIAN__ 20809 __ai __attribute__((target("neon"))) int8x8_t vorn_s8(int8x8_t __p0, int8x8_t __p1) { 20810 int8x8_t __ret; 20811 __ret = __p0 | ~__p1; 20812 return __ret; 20813 } 20814 #else 20815 __ai __attribute__((target("neon"))) int8x8_t vorn_s8(int8x8_t __p0, int8x8_t __p1) { 20816 int8x8_t __ret; 20817 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20818 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 20819 __ret = __rev0 | ~__rev1; 20820 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20821 return __ret; 20822 } 20823 #endif 20824 20825 #ifdef __LITTLE_ENDIAN__ 20826 __ai __attribute__((target("neon"))) int32x2_t vorn_s32(int32x2_t __p0, int32x2_t __p1) { 20827 int32x2_t __ret; 20828 __ret = __p0 | ~__p1; 20829 return __ret; 20830 } 20831 #else 20832 __ai __attribute__((target("neon"))) int32x2_t vorn_s32(int32x2_t __p0, int32x2_t __p1) { 20833 int32x2_t __ret; 20834 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20835 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 20836 __ret = __rev0 | ~__rev1; 20837 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20838 return __ret; 20839 } 20840 #endif 20841 20842 __ai __attribute__((target("neon"))) int64x1_t vorn_s64(int64x1_t __p0, int64x1_t __p1) { 20843 int64x1_t __ret; 20844 __ret = __p0 | ~__p1; 20845 return __ret; 20846 } 20847 
#ifdef __LITTLE_ENDIAN__ 20848 __ai __attribute__((target("neon"))) int16x4_t vorn_s16(int16x4_t __p0, int16x4_t __p1) { 20849 int16x4_t __ret; 20850 __ret = __p0 | ~__p1; 20851 return __ret; 20852 } 20853 #else 20854 __ai __attribute__((target("neon"))) int16x4_t vorn_s16(int16x4_t __p0, int16x4_t __p1) { 20855 int16x4_t __ret; 20856 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20857 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 20858 __ret = __rev0 | ~__rev1; 20859 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20860 return __ret; 20861 } 20862 #endif 20863 20864 #ifdef __LITTLE_ENDIAN__ 20865 __ai __attribute__((target("neon"))) uint8x16_t vorrq_u8(uint8x16_t __p0, uint8x16_t __p1) { 20866 uint8x16_t __ret; 20867 __ret = __p0 | __p1; 20868 return __ret; 20869 } 20870 #else 20871 __ai __attribute__((target("neon"))) uint8x16_t vorrq_u8(uint8x16_t __p0, uint8x16_t __p1) { 20872 uint8x16_t __ret; 20873 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20874 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20875 __ret = __rev0 | __rev1; 20876 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20877 return __ret; 20878 } 20879 #endif 20880 20881 #ifdef __LITTLE_ENDIAN__ 20882 __ai __attribute__((target("neon"))) uint32x4_t vorrq_u32(uint32x4_t __p0, uint32x4_t __p1) { 20883 uint32x4_t __ret; 20884 __ret = __p0 | __p1; 20885 return __ret; 20886 } 20887 #else 20888 __ai __attribute__((target("neon"))) uint32x4_t vorrq_u32(uint32x4_t __p0, uint32x4_t __p1) { 20889 uint32x4_t __ret; 20890 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20891 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 20892 __ret = __rev0 | __rev1; 20893 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20894 return __ret; 20895 } 20896 #endif 20897 20898 #ifdef __LITTLE_ENDIAN__ 20899 __ai __attribute__((target("neon"))) uint64x2_t vorrq_u64(uint64x2_t __p0, uint64x2_t __p1) { 20900 uint64x2_t __ret; 20901 __ret = __p0 | __p1; 20902 return __ret; 20903 } 20904 #else 20905 __ai __attribute__((target("neon"))) uint64x2_t vorrq_u64(uint64x2_t __p0, uint64x2_t __p1) { 20906 uint64x2_t __ret; 20907 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20908 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 20909 __ret = __rev0 | __rev1; 20910 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20911 return __ret; 20912 } 20913 #endif 20914 20915 #ifdef __LITTLE_ENDIAN__ 20916 __ai __attribute__((target("neon"))) uint16x8_t vorrq_u16(uint16x8_t __p0, uint16x8_t __p1) { 20917 uint16x8_t __ret; 20918 __ret = __p0 | __p1; 20919 return __ret; 20920 } 20921 #else 20922 __ai __attribute__((target("neon"))) uint16x8_t vorrq_u16(uint16x8_t __p0, uint16x8_t __p1) { 20923 uint16x8_t __ret; 20924 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20925 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 20926 __ret = __rev0 | __rev1; 20927 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20928 return __ret; 20929 } 20930 #endif 20931 20932 #ifdef __LITTLE_ENDIAN__ 20933 __ai __attribute__((target("neon"))) int8x16_t vorrq_s8(int8x16_t __p0, int8x16_t __p1) { 20934 int8x16_t __ret; 20935 __ret = __p0 | __p1; 20936 return __ret; 20937 } 20938 #else 20939 __ai __attribute__((target("neon"))) int8x16_t vorrq_s8(int8x16_t __p0, int8x16_t __p1) { 20940 int8x16_t __ret; 20941 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20942 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 
2, 1, 0); 20943 __ret = __rev0 | __rev1; 20944 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 20945 return __ret; 20946 } 20947 #endif 20948 20949 #ifdef __LITTLE_ENDIAN__ 20950 __ai __attribute__((target("neon"))) int32x4_t vorrq_s32(int32x4_t __p0, int32x4_t __p1) { 20951 int32x4_t __ret; 20952 __ret = __p0 | __p1; 20953 return __ret; 20954 } 20955 #else 20956 __ai __attribute__((target("neon"))) int32x4_t vorrq_s32(int32x4_t __p0, int32x4_t __p1) { 20957 int32x4_t __ret; 20958 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 20959 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 20960 __ret = __rev0 | __rev1; 20961 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 20962 return __ret; 20963 } 20964 #endif 20965 20966 #ifdef __LITTLE_ENDIAN__ 20967 __ai __attribute__((target("neon"))) int64x2_t vorrq_s64(int64x2_t __p0, int64x2_t __p1) { 20968 int64x2_t __ret; 20969 __ret = __p0 | __p1; 20970 return __ret; 20971 } 20972 #else 20973 __ai __attribute__((target("neon"))) int64x2_t vorrq_s64(int64x2_t __p0, int64x2_t __p1) { 20974 int64x2_t __ret; 20975 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 20976 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 20977 __ret = __rev0 | __rev1; 20978 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 20979 return __ret; 20980 } 20981 #endif 20982 20983 #ifdef __LITTLE_ENDIAN__ 20984 __ai __attribute__((target("neon"))) int16x8_t vorrq_s16(int16x8_t __p0, int16x8_t __p1) { 20985 int16x8_t __ret; 20986 __ret = __p0 | __p1; 20987 return __ret; 20988 } 20989 #else 20990 __ai __attribute__((target("neon"))) int16x8_t vorrq_s16(int16x8_t __p0, int16x8_t __p1) { 20991 int16x8_t __ret; 20992 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 20993 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 20994 
__ret = __rev0 | __rev1; 20995 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 20996 return __ret; 20997 } 20998 #endif 20999 21000 #ifdef __LITTLE_ENDIAN__ 21001 __ai __attribute__((target("neon"))) uint8x8_t vorr_u8(uint8x8_t __p0, uint8x8_t __p1) { 21002 uint8x8_t __ret; 21003 __ret = __p0 | __p1; 21004 return __ret; 21005 } 21006 #else 21007 __ai __attribute__((target("neon"))) uint8x8_t vorr_u8(uint8x8_t __p0, uint8x8_t __p1) { 21008 uint8x8_t __ret; 21009 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21010 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21011 __ret = __rev0 | __rev1; 21012 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21013 return __ret; 21014 } 21015 #endif 21016 21017 #ifdef __LITTLE_ENDIAN__ 21018 __ai __attribute__((target("neon"))) uint32x2_t vorr_u32(uint32x2_t __p0, uint32x2_t __p1) { 21019 uint32x2_t __ret; 21020 __ret = __p0 | __p1; 21021 return __ret; 21022 } 21023 #else 21024 __ai __attribute__((target("neon"))) uint32x2_t vorr_u32(uint32x2_t __p0, uint32x2_t __p1) { 21025 uint32x2_t __ret; 21026 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21027 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21028 __ret = __rev0 | __rev1; 21029 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21030 return __ret; 21031 } 21032 #endif 21033 21034 __ai __attribute__((target("neon"))) uint64x1_t vorr_u64(uint64x1_t __p0, uint64x1_t __p1) { 21035 uint64x1_t __ret; 21036 __ret = __p0 | __p1; 21037 return __ret; 21038 } 21039 #ifdef __LITTLE_ENDIAN__ 21040 __ai __attribute__((target("neon"))) uint16x4_t vorr_u16(uint16x4_t __p0, uint16x4_t __p1) { 21041 uint16x4_t __ret; 21042 __ret = __p0 | __p1; 21043 return __ret; 21044 } 21045 #else 21046 __ai __attribute__((target("neon"))) uint16x4_t vorr_u16(uint16x4_t __p0, uint16x4_t __p1) { 21047 uint16x4_t __ret; 21048 uint16x4_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21049 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21050 __ret = __rev0 | __rev1; 21051 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21052 return __ret; 21053 } 21054 #endif 21055 21056 #ifdef __LITTLE_ENDIAN__ 21057 __ai __attribute__((target("neon"))) int8x8_t vorr_s8(int8x8_t __p0, int8x8_t __p1) { 21058 int8x8_t __ret; 21059 __ret = __p0 | __p1; 21060 return __ret; 21061 } 21062 #else 21063 __ai __attribute__((target("neon"))) int8x8_t vorr_s8(int8x8_t __p0, int8x8_t __p1) { 21064 int8x8_t __ret; 21065 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21066 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21067 __ret = __rev0 | __rev1; 21068 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21069 return __ret; 21070 } 21071 #endif 21072 21073 #ifdef __LITTLE_ENDIAN__ 21074 __ai __attribute__((target("neon"))) int32x2_t vorr_s32(int32x2_t __p0, int32x2_t __p1) { 21075 int32x2_t __ret; 21076 __ret = __p0 | __p1; 21077 return __ret; 21078 } 21079 #else 21080 __ai __attribute__((target("neon"))) int32x2_t vorr_s32(int32x2_t __p0, int32x2_t __p1) { 21081 int32x2_t __ret; 21082 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21083 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21084 __ret = __rev0 | __rev1; 21085 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21086 return __ret; 21087 } 21088 #endif 21089 21090 __ai __attribute__((target("neon"))) int64x1_t vorr_s64(int64x1_t __p0, int64x1_t __p1) { 21091 int64x1_t __ret; 21092 __ret = __p0 | __p1; 21093 return __ret; 21094 } 21095 #ifdef __LITTLE_ENDIAN__ 21096 __ai __attribute__((target("neon"))) int16x4_t vorr_s16(int16x4_t __p0, int16x4_t __p1) { 21097 int16x4_t __ret; 21098 __ret = __p0 | __p1; 21099 return __ret; 21100 } 21101 #else 21102 __ai 
__attribute__((target("neon"))) int16x4_t vorr_s16(int16x4_t __p0, int16x4_t __p1) { 21103 int16x4_t __ret; 21104 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21105 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21106 __ret = __rev0 | __rev1; 21107 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21108 return __ret; 21109 } 21110 #endif 21111 21112 #ifdef __LITTLE_ENDIAN__ 21113 __ai __attribute__((target("neon"))) uint16x8_t vpadalq_u8(uint16x8_t __p0, uint8x16_t __p1) { 21114 uint16x8_t __ret; 21115 __ret = (uint16x8_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 21116 return __ret; 21117 } 21118 #else 21119 __ai __attribute__((target("neon"))) uint16x8_t vpadalq_u8(uint16x8_t __p0, uint8x16_t __p1) { 21120 uint16x8_t __ret; 21121 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21122 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21123 __ret = (uint16x8_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 21124 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21125 return __ret; 21126 } 21127 #endif 21128 21129 #ifdef __LITTLE_ENDIAN__ 21130 __ai __attribute__((target("neon"))) uint64x2_t vpadalq_u32(uint64x2_t __p0, uint32x4_t __p1) { 21131 uint64x2_t __ret; 21132 __ret = (uint64x2_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 21133 return __ret; 21134 } 21135 #else 21136 __ai __attribute__((target("neon"))) uint64x2_t vpadalq_u32(uint64x2_t __p0, uint32x4_t __p1) { 21137 uint64x2_t __ret; 21138 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21139 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21140 __ret = (uint64x2_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 21141 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21142 
return __ret; 21143 } 21144 #endif 21145 21146 #ifdef __LITTLE_ENDIAN__ 21147 __ai __attribute__((target("neon"))) uint32x4_t vpadalq_u16(uint32x4_t __p0, uint16x8_t __p1) { 21148 uint32x4_t __ret; 21149 __ret = (uint32x4_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 21150 return __ret; 21151 } 21152 #else 21153 __ai __attribute__((target("neon"))) uint32x4_t vpadalq_u16(uint32x4_t __p0, uint16x8_t __p1) { 21154 uint32x4_t __ret; 21155 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21156 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21157 __ret = (uint32x4_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 21158 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21159 return __ret; 21160 } 21161 #endif 21162 21163 #ifdef __LITTLE_ENDIAN__ 21164 __ai __attribute__((target("neon"))) int16x8_t vpadalq_s8(int16x8_t __p0, int8x16_t __p1) { 21165 int16x8_t __ret; 21166 __ret = (int16x8_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 21167 return __ret; 21168 } 21169 #else 21170 __ai __attribute__((target("neon"))) int16x8_t vpadalq_s8(int16x8_t __p0, int8x16_t __p1) { 21171 int16x8_t __ret; 21172 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21173 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21174 __ret = (int16x8_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 21175 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21176 return __ret; 21177 } 21178 #endif 21179 21180 #ifdef __LITTLE_ENDIAN__ 21181 __ai __attribute__((target("neon"))) int64x2_t vpadalq_s32(int64x2_t __p0, int32x4_t __p1) { 21182 int64x2_t __ret; 21183 __ret = (int64x2_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 21184 return __ret; 21185 } 21186 #else 21187 __ai 
__attribute__((target("neon"))) int64x2_t vpadalq_s32(int64x2_t __p0, int32x4_t __p1) { 21188 int64x2_t __ret; 21189 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21190 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21191 __ret = (int64x2_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 21192 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21193 return __ret; 21194 } 21195 #endif 21196 21197 #ifdef __LITTLE_ENDIAN__ 21198 __ai __attribute__((target("neon"))) int32x4_t vpadalq_s16(int32x4_t __p0, int16x8_t __p1) { 21199 int32x4_t __ret; 21200 __ret = (int32x4_t) __builtin_neon_vpadalq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 21201 return __ret; 21202 } 21203 #else 21204 __ai __attribute__((target("neon"))) int32x4_t vpadalq_s16(int32x4_t __p0, int16x8_t __p1) { 21205 int32x4_t __ret; 21206 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21207 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21208 __ret = (int32x4_t) __builtin_neon_vpadalq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 21209 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21210 return __ret; 21211 } 21212 #endif 21213 21214 #ifdef __LITTLE_ENDIAN__ 21215 __ai __attribute__((target("neon"))) uint16x4_t vpadal_u8(uint16x4_t __p0, uint8x8_t __p1) { 21216 uint16x4_t __ret; 21217 __ret = (uint16x4_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 21218 return __ret; 21219 } 21220 #else 21221 __ai __attribute__((target("neon"))) uint16x4_t vpadal_u8(uint16x4_t __p0, uint8x8_t __p1) { 21222 uint16x4_t __ret; 21223 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21224 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21225 __ret = (uint16x4_t) __builtin_neon_vpadal_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 21226 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 
21227 return __ret; 21228 } 21229 #endif 21230 21231 #ifdef __LITTLE_ENDIAN__ 21232 __ai __attribute__((target("neon"))) uint64x1_t vpadal_u32(uint64x1_t __p0, uint32x2_t __p1) { 21233 uint64x1_t __ret; 21234 __ret = (uint64x1_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 21235 return __ret; 21236 } 21237 #else 21238 __ai __attribute__((target("neon"))) uint64x1_t vpadal_u32(uint64x1_t __p0, uint32x2_t __p1) { 21239 uint64x1_t __ret; 21240 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21241 __ret = (uint64x1_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__rev1, 19); 21242 return __ret; 21243 } 21244 #endif 21245 21246 #ifdef __LITTLE_ENDIAN__ 21247 __ai __attribute__((target("neon"))) uint32x2_t vpadal_u16(uint32x2_t __p0, uint16x4_t __p1) { 21248 uint32x2_t __ret; 21249 __ret = (uint32x2_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 21250 return __ret; 21251 } 21252 #else 21253 __ai __attribute__((target("neon"))) uint32x2_t vpadal_u16(uint32x2_t __p0, uint16x4_t __p1) { 21254 uint32x2_t __ret; 21255 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21256 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21257 __ret = (uint32x2_t) __builtin_neon_vpadal_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 21258 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21259 return __ret; 21260 } 21261 #endif 21262 21263 #ifdef __LITTLE_ENDIAN__ 21264 __ai __attribute__((target("neon"))) int16x4_t vpadal_s8(int16x4_t __p0, int8x8_t __p1) { 21265 int16x4_t __ret; 21266 __ret = (int16x4_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 21267 return __ret; 21268 } 21269 #else 21270 __ai __attribute__((target("neon"))) int16x4_t vpadal_s8(int16x4_t __p0, int8x8_t __p1) { 21271 int16x4_t __ret; 21272 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21273 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 
1, 0); 21274 __ret = (int16x4_t) __builtin_neon_vpadal_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 21275 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21276 return __ret; 21277 } 21278 #endif 21279 21280 #ifdef __LITTLE_ENDIAN__ 21281 __ai __attribute__((target("neon"))) int64x1_t vpadal_s32(int64x1_t __p0, int32x2_t __p1) { 21282 int64x1_t __ret; 21283 __ret = (int64x1_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 3); 21284 return __ret; 21285 } 21286 #else 21287 __ai __attribute__((target("neon"))) int64x1_t vpadal_s32(int64x1_t __p0, int32x2_t __p1) { 21288 int64x1_t __ret; 21289 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21290 __ret = (int64x1_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__rev1, 3); 21291 return __ret; 21292 } 21293 #endif 21294 21295 #ifdef __LITTLE_ENDIAN__ 21296 __ai __attribute__((target("neon"))) int32x2_t vpadal_s16(int32x2_t __p0, int16x4_t __p1) { 21297 int32x2_t __ret; 21298 __ret = (int32x2_t) __builtin_neon_vpadal_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 21299 return __ret; 21300 } 21301 #else 21302 __ai __attribute__((target("neon"))) int32x2_t vpadal_s16(int32x2_t __p0, int16x4_t __p1) { 21303 int32x2_t __ret; 21304 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21305 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21306 __ret = (int32x2_t) __builtin_neon_vpadal_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 21307 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21308 return __ret; 21309 } 21310 #endif 21311 21312 #ifdef __LITTLE_ENDIAN__ 21313 __ai __attribute__((target("neon"))) uint8x8_t vpadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 21314 uint8x8_t __ret; 21315 __ret = (uint8x8_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 21316 return __ret; 21317 } 21318 #else 21319 __ai __attribute__((target("neon"))) uint8x8_t vpadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 21320 uint8x8_t __ret; 21321 uint8x8_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21322 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21323 __ret = (uint8x8_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 21324 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21325 return __ret; 21326 } 21327 #endif 21328 21329 #ifdef __LITTLE_ENDIAN__ 21330 __ai __attribute__((target("neon"))) uint32x2_t vpadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 21331 uint32x2_t __ret; 21332 __ret = (uint32x2_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 21333 return __ret; 21334 } 21335 #else 21336 __ai __attribute__((target("neon"))) uint32x2_t vpadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 21337 uint32x2_t __ret; 21338 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21339 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21340 __ret = (uint32x2_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 21341 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21342 return __ret; 21343 } 21344 #endif 21345 21346 #ifdef __LITTLE_ENDIAN__ 21347 __ai __attribute__((target("neon"))) uint16x4_t vpadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 21348 uint16x4_t __ret; 21349 __ret = (uint16x4_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 21350 return __ret; 21351 } 21352 #else 21353 __ai __attribute__((target("neon"))) uint16x4_t vpadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 21354 uint16x4_t __ret; 21355 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21356 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21357 __ret = (uint16x4_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 21358 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21359 return __ret; 21360 } 21361 #endif 21362 21363 #ifdef __LITTLE_ENDIAN__ 21364 __ai __attribute__((target("neon"))) int8x8_t 
vpadd_s8(int8x8_t __p0, int8x8_t __p1) { 21365 int8x8_t __ret; 21366 __ret = (int8x8_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 21367 return __ret; 21368 } 21369 #else 21370 __ai __attribute__((target("neon"))) int8x8_t vpadd_s8(int8x8_t __p0, int8x8_t __p1) { 21371 int8x8_t __ret; 21372 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21373 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21374 __ret = (int8x8_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 21375 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21376 return __ret; 21377 } 21378 #endif 21379 21380 #ifdef __LITTLE_ENDIAN__ 21381 __ai __attribute__((target("neon"))) float32x2_t vpadd_f32(float32x2_t __p0, float32x2_t __p1) { 21382 float32x2_t __ret; 21383 __ret = (float32x2_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 21384 return __ret; 21385 } 21386 #else 21387 __ai __attribute__((target("neon"))) float32x2_t vpadd_f32(float32x2_t __p0, float32x2_t __p1) { 21388 float32x2_t __ret; 21389 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21390 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21391 __ret = (float32x2_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 21392 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21393 return __ret; 21394 } 21395 #endif 21396 21397 #ifdef __LITTLE_ENDIAN__ 21398 __ai __attribute__((target("neon"))) int32x2_t vpadd_s32(int32x2_t __p0, int32x2_t __p1) { 21399 int32x2_t __ret; 21400 __ret = (int32x2_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 21401 return __ret; 21402 } 21403 #else 21404 __ai __attribute__((target("neon"))) int32x2_t vpadd_s32(int32x2_t __p0, int32x2_t __p1) { 21405 int32x2_t __ret; 21406 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21407 int32x2_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 1, 0); 21408 __ret = (int32x2_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 21409 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21410 return __ret; 21411 } 21412 #endif 21413 21414 #ifdef __LITTLE_ENDIAN__ 21415 __ai __attribute__((target("neon"))) int16x4_t vpadd_s16(int16x4_t __p0, int16x4_t __p1) { 21416 int16x4_t __ret; 21417 __ret = (int16x4_t) __builtin_neon_vpadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 21418 return __ret; 21419 } 21420 #else 21421 __ai __attribute__((target("neon"))) int16x4_t vpadd_s16(int16x4_t __p0, int16x4_t __p1) { 21422 int16x4_t __ret; 21423 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21424 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21425 __ret = (int16x4_t) __builtin_neon_vpadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 21426 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21427 return __ret; 21428 } 21429 #endif 21430 21431 #ifdef __LITTLE_ENDIAN__ 21432 __ai __attribute__((target("neon"))) uint16x8_t vpaddlq_u8(uint8x16_t __p0) { 21433 uint16x8_t __ret; 21434 __ret = (uint16x8_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 49); 21435 return __ret; 21436 } 21437 #else 21438 __ai __attribute__((target("neon"))) uint16x8_t vpaddlq_u8(uint8x16_t __p0) { 21439 uint16x8_t __ret; 21440 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21441 __ret = (uint16x8_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 49); 21442 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21443 return __ret; 21444 } 21445 #endif 21446 21447 #ifdef __LITTLE_ENDIAN__ 21448 __ai __attribute__((target("neon"))) uint64x2_t vpaddlq_u32(uint32x4_t __p0) { 21449 uint64x2_t __ret; 21450 __ret = (uint64x2_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 51); 21451 return __ret; 21452 } 21453 #else 21454 __ai __attribute__((target("neon"))) uint64x2_t 
vpaddlq_u32(uint32x4_t __p0) { 21455 uint64x2_t __ret; 21456 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21457 __ret = (uint64x2_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 51); 21458 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21459 return __ret; 21460 } 21461 #endif 21462 21463 #ifdef __LITTLE_ENDIAN__ 21464 __ai __attribute__((target("neon"))) uint32x4_t vpaddlq_u16(uint16x8_t __p0) { 21465 uint32x4_t __ret; 21466 __ret = (uint32x4_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 50); 21467 return __ret; 21468 } 21469 #else 21470 __ai __attribute__((target("neon"))) uint32x4_t vpaddlq_u16(uint16x8_t __p0) { 21471 uint32x4_t __ret; 21472 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21473 __ret = (uint32x4_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 50); 21474 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21475 return __ret; 21476 } 21477 #endif 21478 21479 #ifdef __LITTLE_ENDIAN__ 21480 __ai __attribute__((target("neon"))) int16x8_t vpaddlq_s8(int8x16_t __p0) { 21481 int16x8_t __ret; 21482 __ret = (int16x8_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 33); 21483 return __ret; 21484 } 21485 #else 21486 __ai __attribute__((target("neon"))) int16x8_t vpaddlq_s8(int8x16_t __p0) { 21487 int16x8_t __ret; 21488 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21489 __ret = (int16x8_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 33); 21490 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21491 return __ret; 21492 } 21493 #endif 21494 21495 #ifdef __LITTLE_ENDIAN__ 21496 __ai __attribute__((target("neon"))) int64x2_t vpaddlq_s32(int32x4_t __p0) { 21497 int64x2_t __ret; 21498 __ret = (int64x2_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 35); 21499 return __ret; 21500 } 21501 #else 21502 __ai __attribute__((target("neon"))) int64x2_t vpaddlq_s32(int32x4_t __p0) { 21503 int64x2_t __ret; 
21504 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21505 __ret = (int64x2_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 35); 21506 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21507 return __ret; 21508 } 21509 #endif 21510 21511 #ifdef __LITTLE_ENDIAN__ 21512 __ai __attribute__((target("neon"))) int32x4_t vpaddlq_s16(int16x8_t __p0) { 21513 int32x4_t __ret; 21514 __ret = (int32x4_t) __builtin_neon_vpaddlq_v((int8x16_t)__p0, 34); 21515 return __ret; 21516 } 21517 #else 21518 __ai __attribute__((target("neon"))) int32x4_t vpaddlq_s16(int16x8_t __p0) { 21519 int32x4_t __ret; 21520 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21521 __ret = (int32x4_t) __builtin_neon_vpaddlq_v((int8x16_t)__rev0, 34); 21522 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21523 return __ret; 21524 } 21525 #endif 21526 21527 #ifdef __LITTLE_ENDIAN__ 21528 __ai __attribute__((target("neon"))) uint16x4_t vpaddl_u8(uint8x8_t __p0) { 21529 uint16x4_t __ret; 21530 __ret = (uint16x4_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 17); 21531 return __ret; 21532 } 21533 #else 21534 __ai __attribute__((target("neon"))) uint16x4_t vpaddl_u8(uint8x8_t __p0) { 21535 uint16x4_t __ret; 21536 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21537 __ret = (uint16x4_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 17); 21538 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21539 return __ret; 21540 } 21541 #endif 21542 21543 #ifdef __LITTLE_ENDIAN__ 21544 __ai __attribute__((target("neon"))) uint64x1_t vpaddl_u32(uint32x2_t __p0) { 21545 uint64x1_t __ret; 21546 __ret = (uint64x1_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 19); 21547 return __ret; 21548 } 21549 #else 21550 __ai __attribute__((target("neon"))) uint64x1_t vpaddl_u32(uint32x2_t __p0) { 21551 uint64x1_t __ret; 21552 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21553 __ret = (uint64x1_t) 
__builtin_neon_vpaddl_v((int8x8_t)__rev0, 19); 21554 return __ret; 21555 } 21556 #endif 21557 21558 #ifdef __LITTLE_ENDIAN__ 21559 __ai __attribute__((target("neon"))) uint32x2_t vpaddl_u16(uint16x4_t __p0) { 21560 uint32x2_t __ret; 21561 __ret = (uint32x2_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 18); 21562 return __ret; 21563 } 21564 #else 21565 __ai __attribute__((target("neon"))) uint32x2_t vpaddl_u16(uint16x4_t __p0) { 21566 uint32x2_t __ret; 21567 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21568 __ret = (uint32x2_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 18); 21569 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21570 return __ret; 21571 } 21572 #endif 21573 21574 #ifdef __LITTLE_ENDIAN__ 21575 __ai __attribute__((target("neon"))) int16x4_t vpaddl_s8(int8x8_t __p0) { 21576 int16x4_t __ret; 21577 __ret = (int16x4_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 1); 21578 return __ret; 21579 } 21580 #else 21581 __ai __attribute__((target("neon"))) int16x4_t vpaddl_s8(int8x8_t __p0) { 21582 int16x4_t __ret; 21583 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21584 __ret = (int16x4_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 1); 21585 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21586 return __ret; 21587 } 21588 #endif 21589 21590 #ifdef __LITTLE_ENDIAN__ 21591 __ai __attribute__((target("neon"))) int64x1_t vpaddl_s32(int32x2_t __p0) { 21592 int64x1_t __ret; 21593 __ret = (int64x1_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 3); 21594 return __ret; 21595 } 21596 #else 21597 __ai __attribute__((target("neon"))) int64x1_t vpaddl_s32(int32x2_t __p0) { 21598 int64x1_t __ret; 21599 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21600 __ret = (int64x1_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 3); 21601 return __ret; 21602 } 21603 #endif 21604 21605 #ifdef __LITTLE_ENDIAN__ 21606 __ai __attribute__((target("neon"))) int32x2_t vpaddl_s16(int16x4_t __p0) { 
21607 int32x2_t __ret; 21608 __ret = (int32x2_t) __builtin_neon_vpaddl_v((int8x8_t)__p0, 2); 21609 return __ret; 21610 } 21611 #else 21612 __ai __attribute__((target("neon"))) int32x2_t vpaddl_s16(int16x4_t __p0) { 21613 int32x2_t __ret; 21614 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21615 __ret = (int32x2_t) __builtin_neon_vpaddl_v((int8x8_t)__rev0, 2); 21616 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21617 return __ret; 21618 } 21619 #endif 21620 21621 #ifdef __LITTLE_ENDIAN__ 21622 __ai __attribute__((target("neon"))) uint8x8_t vpmax_u8(uint8x8_t __p0, uint8x8_t __p1) { 21623 uint8x8_t __ret; 21624 __ret = (uint8x8_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 21625 return __ret; 21626 } 21627 #else 21628 __ai __attribute__((target("neon"))) uint8x8_t vpmax_u8(uint8x8_t __p0, uint8x8_t __p1) { 21629 uint8x8_t __ret; 21630 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21631 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21632 __ret = (uint8x8_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 21633 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21634 return __ret; 21635 } 21636 #endif 21637 21638 #ifdef __LITTLE_ENDIAN__ 21639 __ai __attribute__((target("neon"))) uint32x2_t vpmax_u32(uint32x2_t __p0, uint32x2_t __p1) { 21640 uint32x2_t __ret; 21641 __ret = (uint32x2_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 21642 return __ret; 21643 } 21644 #else 21645 __ai __attribute__((target("neon"))) uint32x2_t vpmax_u32(uint32x2_t __p0, uint32x2_t __p1) { 21646 uint32x2_t __ret; 21647 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21648 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21649 __ret = (uint32x2_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 21650 __ret = __builtin_shufflevector(__ret, __ret, 
1, 0); 21651 return __ret; 21652 } 21653 #endif 21654 21655 #ifdef __LITTLE_ENDIAN__ 21656 __ai __attribute__((target("neon"))) uint16x4_t vpmax_u16(uint16x4_t __p0, uint16x4_t __p1) { 21657 uint16x4_t __ret; 21658 __ret = (uint16x4_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 21659 return __ret; 21660 } 21661 #else 21662 __ai __attribute__((target("neon"))) uint16x4_t vpmax_u16(uint16x4_t __p0, uint16x4_t __p1) { 21663 uint16x4_t __ret; 21664 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21665 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21666 __ret = (uint16x4_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 21667 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21668 return __ret; 21669 } 21670 #endif 21671 21672 #ifdef __LITTLE_ENDIAN__ 21673 __ai __attribute__((target("neon"))) int8x8_t vpmax_s8(int8x8_t __p0, int8x8_t __p1) { 21674 int8x8_t __ret; 21675 __ret = (int8x8_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 21676 return __ret; 21677 } 21678 #else 21679 __ai __attribute__((target("neon"))) int8x8_t vpmax_s8(int8x8_t __p0, int8x8_t __p1) { 21680 int8x8_t __ret; 21681 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21682 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21683 __ret = (int8x8_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 21684 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21685 return __ret; 21686 } 21687 #endif 21688 21689 #ifdef __LITTLE_ENDIAN__ 21690 __ai __attribute__((target("neon"))) float32x2_t vpmax_f32(float32x2_t __p0, float32x2_t __p1) { 21691 float32x2_t __ret; 21692 __ret = (float32x2_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 21693 return __ret; 21694 } 21695 #else 21696 __ai __attribute__((target("neon"))) float32x2_t vpmax_f32(float32x2_t __p0, float32x2_t __p1) 
{ 21697 float32x2_t __ret; 21698 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21699 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21700 __ret = (float32x2_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 21701 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21702 return __ret; 21703 } 21704 #endif 21705 21706 #ifdef __LITTLE_ENDIAN__ 21707 __ai __attribute__((target("neon"))) int32x2_t vpmax_s32(int32x2_t __p0, int32x2_t __p1) { 21708 int32x2_t __ret; 21709 __ret = (int32x2_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 21710 return __ret; 21711 } 21712 #else 21713 __ai __attribute__((target("neon"))) int32x2_t vpmax_s32(int32x2_t __p0, int32x2_t __p1) { 21714 int32x2_t __ret; 21715 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21716 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21717 __ret = (int32x2_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 21718 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21719 return __ret; 21720 } 21721 #endif 21722 21723 #ifdef __LITTLE_ENDIAN__ 21724 __ai __attribute__((target("neon"))) int16x4_t vpmax_s16(int16x4_t __p0, int16x4_t __p1) { 21725 int16x4_t __ret; 21726 __ret = (int16x4_t) __builtin_neon_vpmax_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 21727 return __ret; 21728 } 21729 #else 21730 __ai __attribute__((target("neon"))) int16x4_t vpmax_s16(int16x4_t __p0, int16x4_t __p1) { 21731 int16x4_t __ret; 21732 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21733 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21734 __ret = (int16x4_t) __builtin_neon_vpmax_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 21735 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21736 return __ret; 21737 } 21738 #endif 21739 21740 #ifdef __LITTLE_ENDIAN__ 21741 __ai __attribute__((target("neon"))) uint8x8_t vpmin_u8(uint8x8_t __p0, 
uint8x8_t __p1) { 21742 uint8x8_t __ret; 21743 __ret = (uint8x8_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 21744 return __ret; 21745 } 21746 #else 21747 __ai __attribute__((target("neon"))) uint8x8_t vpmin_u8(uint8x8_t __p0, uint8x8_t __p1) { 21748 uint8x8_t __ret; 21749 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21750 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21751 __ret = (uint8x8_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 21752 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21753 return __ret; 21754 } 21755 #endif 21756 21757 #ifdef __LITTLE_ENDIAN__ 21758 __ai __attribute__((target("neon"))) uint32x2_t vpmin_u32(uint32x2_t __p0, uint32x2_t __p1) { 21759 uint32x2_t __ret; 21760 __ret = (uint32x2_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 21761 return __ret; 21762 } 21763 #else 21764 __ai __attribute__((target("neon"))) uint32x2_t vpmin_u32(uint32x2_t __p0, uint32x2_t __p1) { 21765 uint32x2_t __ret; 21766 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21767 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21768 __ret = (uint32x2_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 21769 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21770 return __ret; 21771 } 21772 #endif 21773 21774 #ifdef __LITTLE_ENDIAN__ 21775 __ai __attribute__((target("neon"))) uint16x4_t vpmin_u16(uint16x4_t __p0, uint16x4_t __p1) { 21776 uint16x4_t __ret; 21777 __ret = (uint16x4_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 21778 return __ret; 21779 } 21780 #else 21781 __ai __attribute__((target("neon"))) uint16x4_t vpmin_u16(uint16x4_t __p0, uint16x4_t __p1) { 21782 uint16x4_t __ret; 21783 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21784 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, 
__p1, 3, 2, 1, 0); 21785 __ret = (uint16x4_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 21786 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21787 return __ret; 21788 } 21789 #endif 21790 21791 #ifdef __LITTLE_ENDIAN__ 21792 __ai __attribute__((target("neon"))) int8x8_t vpmin_s8(int8x8_t __p0, int8x8_t __p1) { 21793 int8x8_t __ret; 21794 __ret = (int8x8_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 21795 return __ret; 21796 } 21797 #else 21798 __ai __attribute__((target("neon"))) int8x8_t vpmin_s8(int8x8_t __p0, int8x8_t __p1) { 21799 int8x8_t __ret; 21800 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21801 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 21802 __ret = (int8x8_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 21803 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21804 return __ret; 21805 } 21806 #endif 21807 21808 #ifdef __LITTLE_ENDIAN__ 21809 __ai __attribute__((target("neon"))) float32x2_t vpmin_f32(float32x2_t __p0, float32x2_t __p1) { 21810 float32x2_t __ret; 21811 __ret = (float32x2_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 21812 return __ret; 21813 } 21814 #else 21815 __ai __attribute__((target("neon"))) float32x2_t vpmin_f32(float32x2_t __p0, float32x2_t __p1) { 21816 float32x2_t __ret; 21817 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21818 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21819 __ret = (float32x2_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 21820 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21821 return __ret; 21822 } 21823 #endif 21824 21825 #ifdef __LITTLE_ENDIAN__ 21826 __ai __attribute__((target("neon"))) int32x2_t vpmin_s32(int32x2_t __p0, int32x2_t __p1) { 21827 int32x2_t __ret; 21828 __ret = (int32x2_t) __builtin_neon_vpmin_v((int8x8_t)__p0, 
(int8x8_t)__p1, 2); 21829 return __ret; 21830 } 21831 #else 21832 __ai __attribute__((target("neon"))) int32x2_t vpmin_s32(int32x2_t __p0, int32x2_t __p1) { 21833 int32x2_t __ret; 21834 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21835 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 21836 __ret = (int32x2_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 21837 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21838 return __ret; 21839 } 21840 #endif 21841 21842 #ifdef __LITTLE_ENDIAN__ 21843 __ai __attribute__((target("neon"))) int16x4_t vpmin_s16(int16x4_t __p0, int16x4_t __p1) { 21844 int16x4_t __ret; 21845 __ret = (int16x4_t) __builtin_neon_vpmin_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 21846 return __ret; 21847 } 21848 #else 21849 __ai __attribute__((target("neon"))) int16x4_t vpmin_s16(int16x4_t __p0, int16x4_t __p1) { 21850 int16x4_t __ret; 21851 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21852 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21853 __ret = (int16x4_t) __builtin_neon_vpmin_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 21854 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21855 return __ret; 21856 } 21857 #endif 21858 21859 #ifdef __LITTLE_ENDIAN__ 21860 __ai __attribute__((target("neon"))) int8x16_t vqabsq_s8(int8x16_t __p0) { 21861 int8x16_t __ret; 21862 __ret = (int8x16_t) __builtin_neon_vqabsq_v((int8x16_t)__p0, 32); 21863 return __ret; 21864 } 21865 #else 21866 __ai __attribute__((target("neon"))) int8x16_t vqabsq_s8(int8x16_t __p0) { 21867 int8x16_t __ret; 21868 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21869 __ret = (int8x16_t) __builtin_neon_vqabsq_v((int8x16_t)__rev0, 32); 21870 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21871 return __ret; 21872 } 21873 #endif 21874 21875 
#ifdef __LITTLE_ENDIAN__ 21876 __ai __attribute__((target("neon"))) int32x4_t vqabsq_s32(int32x4_t __p0) { 21877 int32x4_t __ret; 21878 __ret = (int32x4_t) __builtin_neon_vqabsq_v((int8x16_t)__p0, 34); 21879 return __ret; 21880 } 21881 #else 21882 __ai __attribute__((target("neon"))) int32x4_t vqabsq_s32(int32x4_t __p0) { 21883 int32x4_t __ret; 21884 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21885 __ret = (int32x4_t) __builtin_neon_vqabsq_v((int8x16_t)__rev0, 34); 21886 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21887 return __ret; 21888 } 21889 #endif 21890 21891 #ifdef __LITTLE_ENDIAN__ 21892 __ai __attribute__((target("neon"))) int16x8_t vqabsq_s16(int16x8_t __p0) { 21893 int16x8_t __ret; 21894 __ret = (int16x8_t) __builtin_neon_vqabsq_v((int8x16_t)__p0, 33); 21895 return __ret; 21896 } 21897 #else 21898 __ai __attribute__((target("neon"))) int16x8_t vqabsq_s16(int16x8_t __p0) { 21899 int16x8_t __ret; 21900 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21901 __ret = (int16x8_t) __builtin_neon_vqabsq_v((int8x16_t)__rev0, 33); 21902 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21903 return __ret; 21904 } 21905 #endif 21906 21907 #ifdef __LITTLE_ENDIAN__ 21908 __ai __attribute__((target("neon"))) int8x8_t vqabs_s8(int8x8_t __p0) { 21909 int8x8_t __ret; 21910 __ret = (int8x8_t) __builtin_neon_vqabs_v((int8x8_t)__p0, 0); 21911 return __ret; 21912 } 21913 #else 21914 __ai __attribute__((target("neon"))) int8x8_t vqabs_s8(int8x8_t __p0) { 21915 int8x8_t __ret; 21916 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 21917 __ret = (int8x8_t) __builtin_neon_vqabs_v((int8x8_t)__rev0, 0); 21918 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 21919 return __ret; 21920 } 21921 #endif 21922 21923 #ifdef __LITTLE_ENDIAN__ 21924 __ai __attribute__((target("neon"))) int32x2_t vqabs_s32(int32x2_t __p0) { 
21925 int32x2_t __ret; 21926 __ret = (int32x2_t) __builtin_neon_vqabs_v((int8x8_t)__p0, 2); 21927 return __ret; 21928 } 21929 #else 21930 __ai __attribute__((target("neon"))) int32x2_t vqabs_s32(int32x2_t __p0) { 21931 int32x2_t __ret; 21932 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21933 __ret = (int32x2_t) __builtin_neon_vqabs_v((int8x8_t)__rev0, 2); 21934 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 21935 return __ret; 21936 } 21937 #endif 21938 21939 #ifdef __LITTLE_ENDIAN__ 21940 __ai __attribute__((target("neon"))) int16x4_t vqabs_s16(int16x4_t __p0) { 21941 int16x4_t __ret; 21942 __ret = (int16x4_t) __builtin_neon_vqabs_v((int8x8_t)__p0, 1); 21943 return __ret; 21944 } 21945 #else 21946 __ai __attribute__((target("neon"))) int16x4_t vqabs_s16(int16x4_t __p0) { 21947 int16x4_t __ret; 21948 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21949 __ret = (int16x4_t) __builtin_neon_vqabs_v((int8x8_t)__rev0, 1); 21950 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21951 return __ret; 21952 } 21953 #endif 21954 21955 #ifdef __LITTLE_ENDIAN__ 21956 __ai __attribute__((target("neon"))) uint8x16_t vqaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 21957 uint8x16_t __ret; 21958 __ret = (uint8x16_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 21959 return __ret; 21960 } 21961 #else 21962 __ai __attribute__((target("neon"))) uint8x16_t vqaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 21963 uint8x16_t __ret; 21964 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21965 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21966 __ret = (uint8x16_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 21967 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 21968 return __ret; 21969 } 21970 
#endif 21971 21972 #ifdef __LITTLE_ENDIAN__ 21973 __ai __attribute__((target("neon"))) uint32x4_t vqaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 21974 uint32x4_t __ret; 21975 __ret = (uint32x4_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 21976 return __ret; 21977 } 21978 #else 21979 __ai __attribute__((target("neon"))) uint32x4_t vqaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 21980 uint32x4_t __ret; 21981 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 21982 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 21983 __ret = (uint32x4_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 21984 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 21985 return __ret; 21986 } 21987 #endif 21988 21989 #ifdef __LITTLE_ENDIAN__ 21990 __ai __attribute__((target("neon"))) uint64x2_t vqaddq_u64(uint64x2_t __p0, uint64x2_t __p1) { 21991 uint64x2_t __ret; 21992 __ret = (uint64x2_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 21993 return __ret; 21994 } 21995 #else 21996 __ai __attribute__((target("neon"))) uint64x2_t vqaddq_u64(uint64x2_t __p0, uint64x2_t __p1) { 21997 uint64x2_t __ret; 21998 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 21999 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22000 __ret = (uint64x2_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 22001 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22002 return __ret; 22003 } 22004 #endif 22005 22006 #ifdef __LITTLE_ENDIAN__ 22007 __ai __attribute__((target("neon"))) uint16x8_t vqaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 22008 uint16x8_t __ret; 22009 __ret = (uint16x8_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 22010 return __ret; 22011 } 22012 #else 22013 __ai __attribute__((target("neon"))) uint16x8_t vqaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 22014 uint16x8_t __ret; 22015 uint16x8_t __rev0; 
__rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22016 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 22017 __ret = (uint16x8_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 22018 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22019 return __ret; 22020 } 22021 #endif 22022 22023 #ifdef __LITTLE_ENDIAN__ 22024 __ai __attribute__((target("neon"))) int8x16_t vqaddq_s8(int8x16_t __p0, int8x16_t __p1) { 22025 int8x16_t __ret; 22026 __ret = (int8x16_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 22027 return __ret; 22028 } 22029 #else 22030 __ai __attribute__((target("neon"))) int8x16_t vqaddq_s8(int8x16_t __p0, int8x16_t __p1) { 22031 int8x16_t __ret; 22032 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 22033 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 22034 __ret = (int8x16_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 22035 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 22036 return __ret; 22037 } 22038 #endif 22039 22040 #ifdef __LITTLE_ENDIAN__ 22041 __ai __attribute__((target("neon"))) int32x4_t vqaddq_s32(int32x4_t __p0, int32x4_t __p1) { 22042 int32x4_t __ret; 22043 __ret = (int32x4_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 22044 return __ret; 22045 } 22046 #else 22047 __ai __attribute__((target("neon"))) int32x4_t vqaddq_s32(int32x4_t __p0, int32x4_t __p1) { 22048 int32x4_t __ret; 22049 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22050 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22051 __ret = (int32x4_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 22052 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 
0); 22053 return __ret; 22054 } 22055 #endif 22056 22057 #ifdef __LITTLE_ENDIAN__ 22058 __ai __attribute__((target("neon"))) int64x2_t vqaddq_s64(int64x2_t __p0, int64x2_t __p1) { 22059 int64x2_t __ret; 22060 __ret = (int64x2_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 22061 return __ret; 22062 } 22063 #else 22064 __ai __attribute__((target("neon"))) int64x2_t vqaddq_s64(int64x2_t __p0, int64x2_t __p1) { 22065 int64x2_t __ret; 22066 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22067 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22068 __ret = (int64x2_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 22069 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22070 return __ret; 22071 } 22072 #endif 22073 22074 #ifdef __LITTLE_ENDIAN__ 22075 __ai __attribute__((target("neon"))) int16x8_t vqaddq_s16(int16x8_t __p0, int16x8_t __p1) { 22076 int16x8_t __ret; 22077 __ret = (int16x8_t) __builtin_neon_vqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 22078 return __ret; 22079 } 22080 #else 22081 __ai __attribute__((target("neon"))) int16x8_t vqaddq_s16(int16x8_t __p0, int16x8_t __p1) { 22082 int16x8_t __ret; 22083 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22084 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 22085 __ret = (int16x8_t) __builtin_neon_vqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 22086 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22087 return __ret; 22088 } 22089 #endif 22090 22091 #ifdef __LITTLE_ENDIAN__ 22092 __ai __attribute__((target("neon"))) uint8x8_t vqadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 22093 uint8x8_t __ret; 22094 __ret = (uint8x8_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 22095 return __ret; 22096 } 22097 #else 22098 __ai __attribute__((target("neon"))) uint8x8_t vqadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 22099 uint8x8_t 
__ret; 22100 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22101 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 22102 __ret = (uint8x8_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 22103 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22104 return __ret; 22105 } 22106 #endif 22107 22108 #ifdef __LITTLE_ENDIAN__ 22109 __ai __attribute__((target("neon"))) uint32x2_t vqadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 22110 uint32x2_t __ret; 22111 __ret = (uint32x2_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 22112 return __ret; 22113 } 22114 #else 22115 __ai __attribute__((target("neon"))) uint32x2_t vqadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 22116 uint32x2_t __ret; 22117 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22118 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22119 __ret = (uint32x2_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 22120 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22121 return __ret; 22122 } 22123 #endif 22124 22125 __ai __attribute__((target("neon"))) uint64x1_t vqadd_u64(uint64x1_t __p0, uint64x1_t __p1) { 22126 uint64x1_t __ret; 22127 __ret = (uint64x1_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 22128 return __ret; 22129 } 22130 #ifdef __LITTLE_ENDIAN__ 22131 __ai __attribute__((target("neon"))) uint16x4_t vqadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 22132 uint16x4_t __ret; 22133 __ret = (uint16x4_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 22134 return __ret; 22135 } 22136 #else 22137 __ai __attribute__((target("neon"))) uint16x4_t vqadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 22138 uint16x4_t __ret; 22139 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22140 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22141 __ret = 
(uint16x4_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 22142 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22143 return __ret; 22144 } 22145 #endif 22146 22147 #ifdef __LITTLE_ENDIAN__ 22148 __ai __attribute__((target("neon"))) int8x8_t vqadd_s8(int8x8_t __p0, int8x8_t __p1) { 22149 int8x8_t __ret; 22150 __ret = (int8x8_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 22151 return __ret; 22152 } 22153 #else 22154 __ai __attribute__((target("neon"))) int8x8_t vqadd_s8(int8x8_t __p0, int8x8_t __p1) { 22155 int8x8_t __ret; 22156 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22157 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 22158 __ret = (int8x8_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 22159 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22160 return __ret; 22161 } 22162 #endif 22163 22164 #ifdef __LITTLE_ENDIAN__ 22165 __ai __attribute__((target("neon"))) int32x2_t vqadd_s32(int32x2_t __p0, int32x2_t __p1) { 22166 int32x2_t __ret; 22167 __ret = (int32x2_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 22168 return __ret; 22169 } 22170 #else 22171 __ai __attribute__((target("neon"))) int32x2_t vqadd_s32(int32x2_t __p0, int32x2_t __p1) { 22172 int32x2_t __ret; 22173 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22174 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22175 __ret = (int32x2_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 22176 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22177 return __ret; 22178 } 22179 #endif 22180 22181 __ai __attribute__((target("neon"))) int64x1_t vqadd_s64(int64x1_t __p0, int64x1_t __p1) { 22182 int64x1_t __ret; 22183 __ret = (int64x1_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 3); 22184 return __ret; 22185 } 22186 #ifdef __LITTLE_ENDIAN__ 22187 __ai 
__attribute__((target("neon"))) int16x4_t vqadd_s16(int16x4_t __p0, int16x4_t __p1) { 22188 int16x4_t __ret; 22189 __ret = (int16x4_t) __builtin_neon_vqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 22190 return __ret; 22191 } 22192 #else 22193 __ai __attribute__((target("neon"))) int16x4_t vqadd_s16(int16x4_t __p0, int16x4_t __p1) { 22194 int16x4_t __ret; 22195 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22196 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22197 __ret = (int16x4_t) __builtin_neon_vqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 22198 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22199 return __ret; 22200 } 22201 #endif 22202 22203 #ifdef __LITTLE_ENDIAN__ 22204 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 22205 int64x2_t __ret; 22206 __ret = (int64x2_t) __builtin_neon_vqdmlal_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 35); 22207 return __ret; 22208 } 22209 #else 22210 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 22211 int64x2_t __ret; 22212 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22213 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22214 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 22215 __ret = (int64x2_t) __builtin_neon_vqdmlal_v((int8x16_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 35); 22216 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22217 return __ret; 22218 } 22219 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 22220 int64x2_t __ret; 22221 __ret = (int64x2_t) __builtin_neon_vqdmlal_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 35); 22222 return __ret; 22223 } 22224 #endif 22225 22226 #ifdef __LITTLE_ENDIAN__ 22227 __ai __attribute__((target("neon"))) int32x4_t 
vqdmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 22228 int32x4_t __ret; 22229 __ret = (int32x4_t) __builtin_neon_vqdmlal_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 34); 22230 return __ret; 22231 } 22232 #else 22233 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 22234 int32x4_t __ret; 22235 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22236 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22237 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 22238 __ret = (int32x4_t) __builtin_neon_vqdmlal_v((int8x16_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 34); 22239 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22240 return __ret; 22241 } 22242 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 22243 int32x4_t __ret; 22244 __ret = (int32x4_t) __builtin_neon_vqdmlal_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 34); 22245 return __ret; 22246 } 22247 #endif 22248 22249 #ifdef __LITTLE_ENDIAN__ 22250 #define vqdmlal_lane_s32(__p0_122, __p1_122, __p2_122, __p3_122) __extension__ ({ \ 22251 int64x2_t __ret_122; \ 22252 int64x2_t __s0_122 = __p0_122; \ 22253 int32x2_t __s1_122 = __p1_122; \ 22254 int32x2_t __s2_122 = __p2_122; \ 22255 __ret_122 = vqdmlal_s32(__s0_122, __s1_122, splat_lane_s32(__s2_122, __p3_122)); \ 22256 __ret_122; \ 22257 }) 22258 #else 22259 #define vqdmlal_lane_s32(__p0_123, __p1_123, __p2_123, __p3_123) __extension__ ({ \ 22260 int64x2_t __ret_123; \ 22261 int64x2_t __s0_123 = __p0_123; \ 22262 int32x2_t __s1_123 = __p1_123; \ 22263 int32x2_t __s2_123 = __p2_123; \ 22264 int64x2_t __rev0_123; __rev0_123 = __builtin_shufflevector(__s0_123, __s0_123, 1, 0); \ 22265 int32x2_t __rev1_123; __rev1_123 = __builtin_shufflevector(__s1_123, __s1_123, 1, 0); \ 22266 int32x2_t __rev2_123; __rev2_123 = 
__builtin_shufflevector(__s2_123, __s2_123, 1, 0); \ 22267 __ret_123 = __noswap_vqdmlal_s32(__rev0_123, __rev1_123, __noswap_splat_lane_s32(__rev2_123, __p3_123)); \ 22268 __ret_123 = __builtin_shufflevector(__ret_123, __ret_123, 1, 0); \ 22269 __ret_123; \ 22270 }) 22271 #endif 22272 22273 #ifdef __LITTLE_ENDIAN__ 22274 #define vqdmlal_lane_s16(__p0_124, __p1_124, __p2_124, __p3_124) __extension__ ({ \ 22275 int32x4_t __ret_124; \ 22276 int32x4_t __s0_124 = __p0_124; \ 22277 int16x4_t __s1_124 = __p1_124; \ 22278 int16x4_t __s2_124 = __p2_124; \ 22279 __ret_124 = vqdmlal_s16(__s0_124, __s1_124, splat_lane_s16(__s2_124, __p3_124)); \ 22280 __ret_124; \ 22281 }) 22282 #else 22283 #define vqdmlal_lane_s16(__p0_125, __p1_125, __p2_125, __p3_125) __extension__ ({ \ 22284 int32x4_t __ret_125; \ 22285 int32x4_t __s0_125 = __p0_125; \ 22286 int16x4_t __s1_125 = __p1_125; \ 22287 int16x4_t __s2_125 = __p2_125; \ 22288 int32x4_t __rev0_125; __rev0_125 = __builtin_shufflevector(__s0_125, __s0_125, 3, 2, 1, 0); \ 22289 int16x4_t __rev1_125; __rev1_125 = __builtin_shufflevector(__s1_125, __s1_125, 3, 2, 1, 0); \ 22290 int16x4_t __rev2_125; __rev2_125 = __builtin_shufflevector(__s2_125, __s2_125, 3, 2, 1, 0); \ 22291 __ret_125 = __noswap_vqdmlal_s16(__rev0_125, __rev1_125, __noswap_splat_lane_s16(__rev2_125, __p3_125)); \ 22292 __ret_125 = __builtin_shufflevector(__ret_125, __ret_125, 3, 2, 1, 0); \ 22293 __ret_125; \ 22294 }) 22295 #endif 22296 22297 #ifdef __LITTLE_ENDIAN__ 22298 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 22299 int64x2_t __ret; 22300 __ret = vqdmlal_s32(__p0, __p1, (int32x2_t) {__p2, __p2}); 22301 return __ret; 22302 } 22303 #else 22304 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 22305 int64x2_t __ret; 22306 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22307 int32x2_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 1, 0); 22308 __ret = __noswap_vqdmlal_s32(__rev0, __rev1, (int32x2_t) {__p2, __p2}); 22309 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22310 return __ret; 22311 } 22312 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 22313 int64x2_t __ret; 22314 __ret = __noswap_vqdmlal_s32(__p0, __p1, (int32x2_t) {__p2, __p2}); 22315 return __ret; 22316 } 22317 #endif 22318 22319 #ifdef __LITTLE_ENDIAN__ 22320 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 22321 int32x4_t __ret; 22322 __ret = vqdmlal_s16(__p0, __p1, (int16x4_t) {__p2, __p2, __p2, __p2}); 22323 return __ret; 22324 } 22325 #else 22326 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 22327 int32x4_t __ret; 22328 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22329 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22330 __ret = __noswap_vqdmlal_s16(__rev0, __rev1, (int16x4_t) {__p2, __p2, __p2, __p2}); 22331 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22332 return __ret; 22333 } 22334 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 22335 int32x4_t __ret; 22336 __ret = __noswap_vqdmlal_s16(__p0, __p1, (int16x4_t) {__p2, __p2, __p2, __p2}); 22337 return __ret; 22338 } 22339 #endif 22340 22341 #ifdef __LITTLE_ENDIAN__ 22342 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 22343 int64x2_t __ret; 22344 __ret = (int64x2_t) __builtin_neon_vqdmlsl_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 35); 22345 return __ret; 22346 } 22347 #else 22348 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 22349 int64x2_t __ret; 22350 int64x2_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22351 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22352 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 22353 __ret = (int64x2_t) __builtin_neon_vqdmlsl_v((int8x16_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 35); 22354 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22355 return __ret; 22356 } 22357 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 22358 int64x2_t __ret; 22359 __ret = (int64x2_t) __builtin_neon_vqdmlsl_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 35); 22360 return __ret; 22361 } 22362 #endif 22363 22364 #ifdef __LITTLE_ENDIAN__ 22365 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 22366 int32x4_t __ret; 22367 __ret = (int32x4_t) __builtin_neon_vqdmlsl_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 34); 22368 return __ret; 22369 } 22370 #else 22371 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 22372 int32x4_t __ret; 22373 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22374 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22375 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 22376 __ret = (int32x4_t) __builtin_neon_vqdmlsl_v((int8x16_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 34); 22377 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22378 return __ret; 22379 } 22380 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 22381 int32x4_t __ret; 22382 __ret = (int32x4_t) __builtin_neon_vqdmlsl_v((int8x16_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 34); 22383 return __ret; 22384 } 22385 #endif 22386 22387 #ifdef __LITTLE_ENDIAN__ 22388 #define vqdmlsl_lane_s32(__p0_126, __p1_126, 
__p2_126, __p3_126) __extension__ ({ \ 22389 int64x2_t __ret_126; \ 22390 int64x2_t __s0_126 = __p0_126; \ 22391 int32x2_t __s1_126 = __p1_126; \ 22392 int32x2_t __s2_126 = __p2_126; \ 22393 __ret_126 = vqdmlsl_s32(__s0_126, __s1_126, splat_lane_s32(__s2_126, __p3_126)); \ 22394 __ret_126; \ 22395 }) 22396 #else 22397 #define vqdmlsl_lane_s32(__p0_127, __p1_127, __p2_127, __p3_127) __extension__ ({ \ 22398 int64x2_t __ret_127; \ 22399 int64x2_t __s0_127 = __p0_127; \ 22400 int32x2_t __s1_127 = __p1_127; \ 22401 int32x2_t __s2_127 = __p2_127; \ 22402 int64x2_t __rev0_127; __rev0_127 = __builtin_shufflevector(__s0_127, __s0_127, 1, 0); \ 22403 int32x2_t __rev1_127; __rev1_127 = __builtin_shufflevector(__s1_127, __s1_127, 1, 0); \ 22404 int32x2_t __rev2_127; __rev2_127 = __builtin_shufflevector(__s2_127, __s2_127, 1, 0); \ 22405 __ret_127 = __noswap_vqdmlsl_s32(__rev0_127, __rev1_127, __noswap_splat_lane_s32(__rev2_127, __p3_127)); \ 22406 __ret_127 = __builtin_shufflevector(__ret_127, __ret_127, 1, 0); \ 22407 __ret_127; \ 22408 }) 22409 #endif 22410 22411 #ifdef __LITTLE_ENDIAN__ 22412 #define vqdmlsl_lane_s16(__p0_128, __p1_128, __p2_128, __p3_128) __extension__ ({ \ 22413 int32x4_t __ret_128; \ 22414 int32x4_t __s0_128 = __p0_128; \ 22415 int16x4_t __s1_128 = __p1_128; \ 22416 int16x4_t __s2_128 = __p2_128; \ 22417 __ret_128 = vqdmlsl_s16(__s0_128, __s1_128, splat_lane_s16(__s2_128, __p3_128)); \ 22418 __ret_128; \ 22419 }) 22420 #else 22421 #define vqdmlsl_lane_s16(__p0_129, __p1_129, __p2_129, __p3_129) __extension__ ({ \ 22422 int32x4_t __ret_129; \ 22423 int32x4_t __s0_129 = __p0_129; \ 22424 int16x4_t __s1_129 = __p1_129; \ 22425 int16x4_t __s2_129 = __p2_129; \ 22426 int32x4_t __rev0_129; __rev0_129 = __builtin_shufflevector(__s0_129, __s0_129, 3, 2, 1, 0); \ 22427 int16x4_t __rev1_129; __rev1_129 = __builtin_shufflevector(__s1_129, __s1_129, 3, 2, 1, 0); \ 22428 int16x4_t __rev2_129; __rev2_129 = __builtin_shufflevector(__s2_129, __s2_129, 3, 2, 1, 0); \ 
22429 __ret_129 = __noswap_vqdmlsl_s16(__rev0_129, __rev1_129, __noswap_splat_lane_s16(__rev2_129, __p3_129)); \ 22430 __ret_129 = __builtin_shufflevector(__ret_129, __ret_129, 3, 2, 1, 0); \ 22431 __ret_129; \ 22432 }) 22433 #endif 22434 22435 #ifdef __LITTLE_ENDIAN__ 22436 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 22437 int64x2_t __ret; 22438 __ret = vqdmlsl_s32(__p0, __p1, (int32x2_t) {__p2, __p2}); 22439 return __ret; 22440 } 22441 #else 22442 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 22443 int64x2_t __ret; 22444 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22445 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22446 __ret = __noswap_vqdmlsl_s32(__rev0, __rev1, (int32x2_t) {__p2, __p2}); 22447 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22448 return __ret; 22449 } 22450 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 22451 int64x2_t __ret; 22452 __ret = __noswap_vqdmlsl_s32(__p0, __p1, (int32x2_t) {__p2, __p2}); 22453 return __ret; 22454 } 22455 #endif 22456 22457 #ifdef __LITTLE_ENDIAN__ 22458 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 22459 int32x4_t __ret; 22460 __ret = vqdmlsl_s16(__p0, __p1, (int16x4_t) {__p2, __p2, __p2, __p2}); 22461 return __ret; 22462 } 22463 #else 22464 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 22465 int32x4_t __ret; 22466 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22467 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22468 __ret = __noswap_vqdmlsl_s16(__rev0, __rev1, (int16x4_t) {__p2, __p2, __p2, __p2}); 22469 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22470 return __ret; 
22471 } 22472 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 22473 int32x4_t __ret; 22474 __ret = __noswap_vqdmlsl_s16(__p0, __p1, (int16x4_t) {__p2, __p2, __p2, __p2}); 22475 return __ret; 22476 } 22477 #endif 22478 22479 #ifdef __LITTLE_ENDIAN__ 22480 __ai __attribute__((target("neon"))) int32x4_t vqdmulhq_s32(int32x4_t __p0, int32x4_t __p1) { 22481 int32x4_t __ret; 22482 __ret = (int32x4_t) __builtin_neon_vqdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 22483 return __ret; 22484 } 22485 #else 22486 __ai __attribute__((target("neon"))) int32x4_t vqdmulhq_s32(int32x4_t __p0, int32x4_t __p1) { 22487 int32x4_t __ret; 22488 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22489 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22490 __ret = (int32x4_t) __builtin_neon_vqdmulhq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 22491 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22492 return __ret; 22493 } 22494 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmulhq_s32(int32x4_t __p0, int32x4_t __p1) { 22495 int32x4_t __ret; 22496 __ret = (int32x4_t) __builtin_neon_vqdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 22497 return __ret; 22498 } 22499 #endif 22500 22501 #ifdef __LITTLE_ENDIAN__ 22502 __ai __attribute__((target("neon"))) int16x8_t vqdmulhq_s16(int16x8_t __p0, int16x8_t __p1) { 22503 int16x8_t __ret; 22504 __ret = (int16x8_t) __builtin_neon_vqdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 22505 return __ret; 22506 } 22507 #else 22508 __ai __attribute__((target("neon"))) int16x8_t vqdmulhq_s16(int16x8_t __p0, int16x8_t __p1) { 22509 int16x8_t __ret; 22510 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22511 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 22512 __ret = (int16x8_t) __builtin_neon_vqdmulhq_v((int8x16_t)__rev0, 
(int8x16_t)__rev1, 33); 22513 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22514 return __ret; 22515 } 22516 __ai __attribute__((target("neon"))) int16x8_t __noswap_vqdmulhq_s16(int16x8_t __p0, int16x8_t __p1) { 22517 int16x8_t __ret; 22518 __ret = (int16x8_t) __builtin_neon_vqdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 22519 return __ret; 22520 } 22521 #endif 22522 22523 #ifdef __LITTLE_ENDIAN__ 22524 __ai __attribute__((target("neon"))) int32x2_t vqdmulh_s32(int32x2_t __p0, int32x2_t __p1) { 22525 int32x2_t __ret; 22526 __ret = (int32x2_t) __builtin_neon_vqdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 22527 return __ret; 22528 } 22529 #else 22530 __ai __attribute__((target("neon"))) int32x2_t vqdmulh_s32(int32x2_t __p0, int32x2_t __p1) { 22531 int32x2_t __ret; 22532 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22533 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22534 __ret = (int32x2_t) __builtin_neon_vqdmulh_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 22535 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22536 return __ret; 22537 } 22538 __ai __attribute__((target("neon"))) int32x2_t __noswap_vqdmulh_s32(int32x2_t __p0, int32x2_t __p1) { 22539 int32x2_t __ret; 22540 __ret = (int32x2_t) __builtin_neon_vqdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 22541 return __ret; 22542 } 22543 #endif 22544 22545 #ifdef __LITTLE_ENDIAN__ 22546 __ai __attribute__((target("neon"))) int16x4_t vqdmulh_s16(int16x4_t __p0, int16x4_t __p1) { 22547 int16x4_t __ret; 22548 __ret = (int16x4_t) __builtin_neon_vqdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 22549 return __ret; 22550 } 22551 #else 22552 __ai __attribute__((target("neon"))) int16x4_t vqdmulh_s16(int16x4_t __p0, int16x4_t __p1) { 22553 int16x4_t __ret; 22554 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22555 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22556 __ret = (int16x4_t) 
__builtin_neon_vqdmulh_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 22557 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22558 return __ret; 22559 } 22560 __ai __attribute__((target("neon"))) int16x4_t __noswap_vqdmulh_s16(int16x4_t __p0, int16x4_t __p1) { 22561 int16x4_t __ret; 22562 __ret = (int16x4_t) __builtin_neon_vqdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 22563 return __ret; 22564 } 22565 #endif 22566 22567 #ifdef __LITTLE_ENDIAN__ 22568 __ai __attribute__((target("neon"))) int32x4_t vqdmulhq_n_s32(int32x4_t __p0, int32_t __p1) { 22569 int32x4_t __ret; 22570 __ret = vqdmulhq_s32(__p0, (int32x4_t) {__p1, __p1, __p1, __p1}); 22571 return __ret; 22572 } 22573 #else 22574 __ai __attribute__((target("neon"))) int32x4_t vqdmulhq_n_s32(int32x4_t __p0, int32_t __p1) { 22575 int32x4_t __ret; 22576 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22577 __ret = __noswap_vqdmulhq_s32(__rev0, (int32x4_t) {__p1, __p1, __p1, __p1}); 22578 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22579 return __ret; 22580 } 22581 #endif 22582 22583 #ifdef __LITTLE_ENDIAN__ 22584 __ai __attribute__((target("neon"))) int16x8_t vqdmulhq_n_s16(int16x8_t __p0, int16_t __p1) { 22585 int16x8_t __ret; 22586 __ret = vqdmulhq_s16(__p0, (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1}); 22587 return __ret; 22588 } 22589 #else 22590 __ai __attribute__((target("neon"))) int16x8_t vqdmulhq_n_s16(int16x8_t __p0, int16_t __p1) { 22591 int16x8_t __ret; 22592 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22593 __ret = __noswap_vqdmulhq_s16(__rev0, (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1}); 22594 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22595 return __ret; 22596 } 22597 #endif 22598 22599 #ifdef __LITTLE_ENDIAN__ 22600 __ai __attribute__((target("neon"))) int32x2_t vqdmulh_n_s32(int32x2_t __p0, int32_t __p1) { 22601 int32x2_t __ret; 22602 __ret = 
vqdmulh_s32(__p0, (int32x2_t) {__p1, __p1}); 22603 return __ret; 22604 } 22605 #else 22606 __ai __attribute__((target("neon"))) int32x2_t vqdmulh_n_s32(int32x2_t __p0, int32_t __p1) { 22607 int32x2_t __ret; 22608 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22609 __ret = __noswap_vqdmulh_s32(__rev0, (int32x2_t) {__p1, __p1}); 22610 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22611 return __ret; 22612 } 22613 #endif 22614 22615 #ifdef __LITTLE_ENDIAN__ 22616 __ai __attribute__((target("neon"))) int16x4_t vqdmulh_n_s16(int16x4_t __p0, int16_t __p1) { 22617 int16x4_t __ret; 22618 __ret = vqdmulh_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1}); 22619 return __ret; 22620 } 22621 #else 22622 __ai __attribute__((target("neon"))) int16x4_t vqdmulh_n_s16(int16x4_t __p0, int16_t __p1) { 22623 int16x4_t __ret; 22624 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22625 __ret = __noswap_vqdmulh_s16(__rev0, (int16x4_t) {__p1, __p1, __p1, __p1}); 22626 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22627 return __ret; 22628 } 22629 #endif 22630 22631 #ifdef __LITTLE_ENDIAN__ 22632 __ai __attribute__((target("neon"))) int64x2_t vqdmull_s32(int32x2_t __p0, int32x2_t __p1) { 22633 int64x2_t __ret; 22634 __ret = (int64x2_t) __builtin_neon_vqdmull_v((int8x8_t)__p0, (int8x8_t)__p1, 35); 22635 return __ret; 22636 } 22637 #else 22638 __ai __attribute__((target("neon"))) int64x2_t vqdmull_s32(int32x2_t __p0, int32x2_t __p1) { 22639 int64x2_t __ret; 22640 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22641 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 22642 __ret = (int64x2_t) __builtin_neon_vqdmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 35); 22643 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22644 return __ret; 22645 } 22646 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmull_s32(int32x2_t __p0, int32x2_t __p1) { 22647 int64x2_t __ret; 22648 __ret = 
(int64x2_t) __builtin_neon_vqdmull_v((int8x8_t)__p0, (int8x8_t)__p1, 35); 22649 return __ret; 22650 } 22651 #endif 22652 22653 #ifdef __LITTLE_ENDIAN__ 22654 __ai __attribute__((target("neon"))) int32x4_t vqdmull_s16(int16x4_t __p0, int16x4_t __p1) { 22655 int32x4_t __ret; 22656 __ret = (int32x4_t) __builtin_neon_vqdmull_v((int8x8_t)__p0, (int8x8_t)__p1, 34); 22657 return __ret; 22658 } 22659 #else 22660 __ai __attribute__((target("neon"))) int32x4_t vqdmull_s16(int16x4_t __p0, int16x4_t __p1) { 22661 int32x4_t __ret; 22662 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22663 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 22664 __ret = (int32x4_t) __builtin_neon_vqdmull_v((int8x8_t)__rev0, (int8x8_t)__rev1, 34); 22665 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22666 return __ret; 22667 } 22668 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmull_s16(int16x4_t __p0, int16x4_t __p1) { 22669 int32x4_t __ret; 22670 __ret = (int32x4_t) __builtin_neon_vqdmull_v((int8x8_t)__p0, (int8x8_t)__p1, 34); 22671 return __ret; 22672 } 22673 #endif 22674 22675 #ifdef __LITTLE_ENDIAN__ 22676 #define vqdmull_lane_s32(__p0_130, __p1_130, __p2_130) __extension__ ({ \ 22677 int64x2_t __ret_130; \ 22678 int32x2_t __s0_130 = __p0_130; \ 22679 int32x2_t __s1_130 = __p1_130; \ 22680 __ret_130 = vqdmull_s32(__s0_130, splat_lane_s32(__s1_130, __p2_130)); \ 22681 __ret_130; \ 22682 }) 22683 #else 22684 #define vqdmull_lane_s32(__p0_131, __p1_131, __p2_131) __extension__ ({ \ 22685 int64x2_t __ret_131; \ 22686 int32x2_t __s0_131 = __p0_131; \ 22687 int32x2_t __s1_131 = __p1_131; \ 22688 int32x2_t __rev0_131; __rev0_131 = __builtin_shufflevector(__s0_131, __s0_131, 1, 0); \ 22689 int32x2_t __rev1_131; __rev1_131 = __builtin_shufflevector(__s1_131, __s1_131, 1, 0); \ 22690 __ret_131 = __noswap_vqdmull_s32(__rev0_131, __noswap_splat_lane_s32(__rev1_131, __p2_131)); \ 22691 __ret_131 = 
__builtin_shufflevector(__ret_131, __ret_131, 1, 0); \ 22692 __ret_131; \ 22693 }) 22694 #endif 22695 22696 #ifdef __LITTLE_ENDIAN__ 22697 #define vqdmull_lane_s16(__p0_132, __p1_132, __p2_132) __extension__ ({ \ 22698 int32x4_t __ret_132; \ 22699 int16x4_t __s0_132 = __p0_132; \ 22700 int16x4_t __s1_132 = __p1_132; \ 22701 __ret_132 = vqdmull_s16(__s0_132, splat_lane_s16(__s1_132, __p2_132)); \ 22702 __ret_132; \ 22703 }) 22704 #else 22705 #define vqdmull_lane_s16(__p0_133, __p1_133, __p2_133) __extension__ ({ \ 22706 int32x4_t __ret_133; \ 22707 int16x4_t __s0_133 = __p0_133; \ 22708 int16x4_t __s1_133 = __p1_133; \ 22709 int16x4_t __rev0_133; __rev0_133 = __builtin_shufflevector(__s0_133, __s0_133, 3, 2, 1, 0); \ 22710 int16x4_t __rev1_133; __rev1_133 = __builtin_shufflevector(__s1_133, __s1_133, 3, 2, 1, 0); \ 22711 __ret_133 = __noswap_vqdmull_s16(__rev0_133, __noswap_splat_lane_s16(__rev1_133, __p2_133)); \ 22712 __ret_133 = __builtin_shufflevector(__ret_133, __ret_133, 3, 2, 1, 0); \ 22713 __ret_133; \ 22714 }) 22715 #endif 22716 22717 #ifdef __LITTLE_ENDIAN__ 22718 __ai __attribute__((target("neon"))) int64x2_t vqdmull_n_s32(int32x2_t __p0, int32_t __p1) { 22719 int64x2_t __ret; 22720 __ret = vqdmull_s32(__p0, (int32x2_t) {__p1, __p1}); 22721 return __ret; 22722 } 22723 #else 22724 __ai __attribute__((target("neon"))) int64x2_t vqdmull_n_s32(int32x2_t __p0, int32_t __p1) { 22725 int64x2_t __ret; 22726 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22727 __ret = __noswap_vqdmull_s32(__rev0, (int32x2_t) {__p1, __p1}); 22728 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22729 return __ret; 22730 } 22731 __ai __attribute__((target("neon"))) int64x2_t __noswap_vqdmull_n_s32(int32x2_t __p0, int32_t __p1) { 22732 int64x2_t __ret; 22733 __ret = __noswap_vqdmull_s32(__p0, (int32x2_t) {__p1, __p1}); 22734 return __ret; 22735 } 22736 #endif 22737 22738 #ifdef __LITTLE_ENDIAN__ 22739 __ai __attribute__((target("neon"))) int32x4_t 
vqdmull_n_s16(int16x4_t __p0, int16_t __p1) { 22740 int32x4_t __ret; 22741 __ret = vqdmull_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1}); 22742 return __ret; 22743 } 22744 #else 22745 __ai __attribute__((target("neon"))) int32x4_t vqdmull_n_s16(int16x4_t __p0, int16_t __p1) { 22746 int32x4_t __ret; 22747 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22748 __ret = __noswap_vqdmull_s16(__rev0, (int16x4_t) {__p1, __p1, __p1, __p1}); 22749 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22750 return __ret; 22751 } 22752 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqdmull_n_s16(int16x4_t __p0, int16_t __p1) { 22753 int32x4_t __ret; 22754 __ret = __noswap_vqdmull_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1}); 22755 return __ret; 22756 } 22757 #endif 22758 22759 #ifdef __LITTLE_ENDIAN__ 22760 __ai __attribute__((target("neon"))) uint16x4_t vqmovn_u32(uint32x4_t __p0) { 22761 uint16x4_t __ret; 22762 __ret = (uint16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 17); 22763 return __ret; 22764 } 22765 #else 22766 __ai __attribute__((target("neon"))) uint16x4_t vqmovn_u32(uint32x4_t __p0) { 22767 uint16x4_t __ret; 22768 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22769 __ret = (uint16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 17); 22770 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22771 return __ret; 22772 } 22773 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vqmovn_u32(uint32x4_t __p0) { 22774 uint16x4_t __ret; 22775 __ret = (uint16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 17); 22776 return __ret; 22777 } 22778 #endif 22779 22780 #ifdef __LITTLE_ENDIAN__ 22781 __ai __attribute__((target("neon"))) uint32x2_t vqmovn_u64(uint64x2_t __p0) { 22782 uint32x2_t __ret; 22783 __ret = (uint32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 18); 22784 return __ret; 22785 } 22786 #else 22787 __ai __attribute__((target("neon"))) uint32x2_t vqmovn_u64(uint64x2_t __p0) 
{ 22788 uint32x2_t __ret; 22789 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22790 __ret = (uint32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 18); 22791 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22792 return __ret; 22793 } 22794 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vqmovn_u64(uint64x2_t __p0) { 22795 uint32x2_t __ret; 22796 __ret = (uint32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 18); 22797 return __ret; 22798 } 22799 #endif 22800 22801 #ifdef __LITTLE_ENDIAN__ 22802 __ai __attribute__((target("neon"))) uint8x8_t vqmovn_u16(uint16x8_t __p0) { 22803 uint8x8_t __ret; 22804 __ret = (uint8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 16); 22805 return __ret; 22806 } 22807 #else 22808 __ai __attribute__((target("neon"))) uint8x8_t vqmovn_u16(uint16x8_t __p0) { 22809 uint8x8_t __ret; 22810 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22811 __ret = (uint8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 16); 22812 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22813 return __ret; 22814 } 22815 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vqmovn_u16(uint16x8_t __p0) { 22816 uint8x8_t __ret; 22817 __ret = (uint8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 16); 22818 return __ret; 22819 } 22820 #endif 22821 22822 #ifdef __LITTLE_ENDIAN__ 22823 __ai __attribute__((target("neon"))) int16x4_t vqmovn_s32(int32x4_t __p0) { 22824 int16x4_t __ret; 22825 __ret = (int16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 1); 22826 return __ret; 22827 } 22828 #else 22829 __ai __attribute__((target("neon"))) int16x4_t vqmovn_s32(int32x4_t __p0) { 22830 int16x4_t __ret; 22831 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22832 __ret = (int16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 1); 22833 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22834 return __ret; 22835 } 22836 __ai 
__attribute__((target("neon"))) int16x4_t __noswap_vqmovn_s32(int32x4_t __p0) { 22837 int16x4_t __ret; 22838 __ret = (int16x4_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 1); 22839 return __ret; 22840 } 22841 #endif 22842 22843 #ifdef __LITTLE_ENDIAN__ 22844 __ai __attribute__((target("neon"))) int32x2_t vqmovn_s64(int64x2_t __p0) { 22845 int32x2_t __ret; 22846 __ret = (int32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 2); 22847 return __ret; 22848 } 22849 #else 22850 __ai __attribute__((target("neon"))) int32x2_t vqmovn_s64(int64x2_t __p0) { 22851 int32x2_t __ret; 22852 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22853 __ret = (int32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 2); 22854 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22855 return __ret; 22856 } 22857 __ai __attribute__((target("neon"))) int32x2_t __noswap_vqmovn_s64(int64x2_t __p0) { 22858 int32x2_t __ret; 22859 __ret = (int32x2_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 2); 22860 return __ret; 22861 } 22862 #endif 22863 22864 #ifdef __LITTLE_ENDIAN__ 22865 __ai __attribute__((target("neon"))) int8x8_t vqmovn_s16(int16x8_t __p0) { 22866 int8x8_t __ret; 22867 __ret = (int8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 0); 22868 return __ret; 22869 } 22870 #else 22871 __ai __attribute__((target("neon"))) int8x8_t vqmovn_s16(int16x8_t __p0) { 22872 int8x8_t __ret; 22873 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22874 __ret = (int8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__rev0, 0); 22875 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22876 return __ret; 22877 } 22878 __ai __attribute__((target("neon"))) int8x8_t __noswap_vqmovn_s16(int16x8_t __p0) { 22879 int8x8_t __ret; 22880 __ret = (int8x8_t) __builtin_neon_vqmovn_v((int8x16_t)__p0, 0); 22881 return __ret; 22882 } 22883 #endif 22884 22885 #ifdef __LITTLE_ENDIAN__ 22886 __ai __attribute__((target("neon"))) uint16x4_t vqmovun_s32(int32x4_t 
__p0) { 22887 uint16x4_t __ret; 22888 __ret = (uint16x4_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 17); 22889 return __ret; 22890 } 22891 #else 22892 __ai __attribute__((target("neon"))) uint16x4_t vqmovun_s32(int32x4_t __p0) { 22893 uint16x4_t __ret; 22894 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22895 __ret = (uint16x4_t) __builtin_neon_vqmovun_v((int8x16_t)__rev0, 17); 22896 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22897 return __ret; 22898 } 22899 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vqmovun_s32(int32x4_t __p0) { 22900 uint16x4_t __ret; 22901 __ret = (uint16x4_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 17); 22902 return __ret; 22903 } 22904 #endif 22905 22906 #ifdef __LITTLE_ENDIAN__ 22907 __ai __attribute__((target("neon"))) uint32x2_t vqmovun_s64(int64x2_t __p0) { 22908 uint32x2_t __ret; 22909 __ret = (uint32x2_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 18); 22910 return __ret; 22911 } 22912 #else 22913 __ai __attribute__((target("neon"))) uint32x2_t vqmovun_s64(int64x2_t __p0) { 22914 uint32x2_t __ret; 22915 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 22916 __ret = (uint32x2_t) __builtin_neon_vqmovun_v((int8x16_t)__rev0, 18); 22917 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 22918 return __ret; 22919 } 22920 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vqmovun_s64(int64x2_t __p0) { 22921 uint32x2_t __ret; 22922 __ret = (uint32x2_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 18); 22923 return __ret; 22924 } 22925 #endif 22926 22927 #ifdef __LITTLE_ENDIAN__ 22928 __ai __attribute__((target("neon"))) uint8x8_t vqmovun_s16(int16x8_t __p0) { 22929 uint8x8_t __ret; 22930 __ret = (uint8x8_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 16); 22931 return __ret; 22932 } 22933 #else 22934 __ai __attribute__((target("neon"))) uint8x8_t vqmovun_s16(int16x8_t __p0) { 22935 uint8x8_t __ret; 22936 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, 
__p0, 7, 6, 5, 4, 3, 2, 1, 0); 22937 __ret = (uint8x8_t) __builtin_neon_vqmovun_v((int8x16_t)__rev0, 16); 22938 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22939 return __ret; 22940 } 22941 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vqmovun_s16(int16x8_t __p0) { 22942 uint8x8_t __ret; 22943 __ret = (uint8x8_t) __builtin_neon_vqmovun_v((int8x16_t)__p0, 16); 22944 return __ret; 22945 } 22946 #endif 22947 22948 #ifdef __LITTLE_ENDIAN__ 22949 __ai __attribute__((target("neon"))) int8x16_t vqnegq_s8(int8x16_t __p0) { 22950 int8x16_t __ret; 22951 __ret = (int8x16_t) __builtin_neon_vqnegq_v((int8x16_t)__p0, 32); 22952 return __ret; 22953 } 22954 #else 22955 __ai __attribute__((target("neon"))) int8x16_t vqnegq_s8(int8x16_t __p0) { 22956 int8x16_t __ret; 22957 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 22958 __ret = (int8x16_t) __builtin_neon_vqnegq_v((int8x16_t)__rev0, 32); 22959 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 22960 return __ret; 22961 } 22962 #endif 22963 22964 #ifdef __LITTLE_ENDIAN__ 22965 __ai __attribute__((target("neon"))) int32x4_t vqnegq_s32(int32x4_t __p0) { 22966 int32x4_t __ret; 22967 __ret = (int32x4_t) __builtin_neon_vqnegq_v((int8x16_t)__p0, 34); 22968 return __ret; 22969 } 22970 #else 22971 __ai __attribute__((target("neon"))) int32x4_t vqnegq_s32(int32x4_t __p0) { 22972 int32x4_t __ret; 22973 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 22974 __ret = (int32x4_t) __builtin_neon_vqnegq_v((int8x16_t)__rev0, 34); 22975 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 22976 return __ret; 22977 } 22978 #endif 22979 22980 #ifdef __LITTLE_ENDIAN__ 22981 __ai __attribute__((target("neon"))) int16x8_t vqnegq_s16(int16x8_t __p0) { 22982 int16x8_t __ret; 22983 __ret = (int16x8_t) __builtin_neon_vqnegq_v((int8x16_t)__p0, 33); 22984 return __ret; 
22985 } 22986 #else 22987 __ai __attribute__((target("neon"))) int16x8_t vqnegq_s16(int16x8_t __p0) { 22988 int16x8_t __ret; 22989 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 22990 __ret = (int16x8_t) __builtin_neon_vqnegq_v((int8x16_t)__rev0, 33); 22991 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 22992 return __ret; 22993 } 22994 #endif 22995 22996 #ifdef __LITTLE_ENDIAN__ 22997 __ai __attribute__((target("neon"))) int8x8_t vqneg_s8(int8x8_t __p0) { 22998 int8x8_t __ret; 22999 __ret = (int8x8_t) __builtin_neon_vqneg_v((int8x8_t)__p0, 0); 23000 return __ret; 23001 } 23002 #else 23003 __ai __attribute__((target("neon"))) int8x8_t vqneg_s8(int8x8_t __p0) { 23004 int8x8_t __ret; 23005 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23006 __ret = (int8x8_t) __builtin_neon_vqneg_v((int8x8_t)__rev0, 0); 23007 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23008 return __ret; 23009 } 23010 #endif 23011 23012 #ifdef __LITTLE_ENDIAN__ 23013 __ai __attribute__((target("neon"))) int32x2_t vqneg_s32(int32x2_t __p0) { 23014 int32x2_t __ret; 23015 __ret = (int32x2_t) __builtin_neon_vqneg_v((int8x8_t)__p0, 2); 23016 return __ret; 23017 } 23018 #else 23019 __ai __attribute__((target("neon"))) int32x2_t vqneg_s32(int32x2_t __p0) { 23020 int32x2_t __ret; 23021 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23022 __ret = (int32x2_t) __builtin_neon_vqneg_v((int8x8_t)__rev0, 2); 23023 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23024 return __ret; 23025 } 23026 #endif 23027 23028 #ifdef __LITTLE_ENDIAN__ 23029 __ai __attribute__((target("neon"))) int16x4_t vqneg_s16(int16x4_t __p0) { 23030 int16x4_t __ret; 23031 __ret = (int16x4_t) __builtin_neon_vqneg_v((int8x8_t)__p0, 1); 23032 return __ret; 23033 } 23034 #else 23035 __ai __attribute__((target("neon"))) int16x4_t vqneg_s16(int16x4_t __p0) { 23036 int16x4_t __ret; 23037 
int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23038 __ret = (int16x4_t) __builtin_neon_vqneg_v((int8x8_t)__rev0, 1); 23039 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23040 return __ret; 23041 } 23042 #endif 23043 23044 #ifdef __LITTLE_ENDIAN__ 23045 __ai __attribute__((target("neon"))) int32x4_t vqrdmulhq_s32(int32x4_t __p0, int32x4_t __p1) { 23046 int32x4_t __ret; 23047 __ret = (int32x4_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 23048 return __ret; 23049 } 23050 #else 23051 __ai __attribute__((target("neon"))) int32x4_t vqrdmulhq_s32(int32x4_t __p0, int32x4_t __p1) { 23052 int32x4_t __ret; 23053 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23054 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23055 __ret = (int32x4_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 23056 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23057 return __ret; 23058 } 23059 __ai __attribute__((target("neon"))) int32x4_t __noswap_vqrdmulhq_s32(int32x4_t __p0, int32x4_t __p1) { 23060 int32x4_t __ret; 23061 __ret = (int32x4_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 23062 return __ret; 23063 } 23064 #endif 23065 23066 #ifdef __LITTLE_ENDIAN__ 23067 __ai __attribute__((target("neon"))) int16x8_t vqrdmulhq_s16(int16x8_t __p0, int16x8_t __p1) { 23068 int16x8_t __ret; 23069 __ret = (int16x8_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 23070 return __ret; 23071 } 23072 #else 23073 __ai __attribute__((target("neon"))) int16x8_t vqrdmulhq_s16(int16x8_t __p0, int16x8_t __p1) { 23074 int16x8_t __ret; 23075 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23076 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 23077 __ret = (int16x8_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 23078 
__ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23079 return __ret; 23080 } 23081 __ai __attribute__((target("neon"))) int16x8_t __noswap_vqrdmulhq_s16(int16x8_t __p0, int16x8_t __p1) { 23082 int16x8_t __ret; 23083 __ret = (int16x8_t) __builtin_neon_vqrdmulhq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 23084 return __ret; 23085 } 23086 #endif 23087 23088 #ifdef __LITTLE_ENDIAN__ 23089 __ai __attribute__((target("neon"))) int32x2_t vqrdmulh_s32(int32x2_t __p0, int32x2_t __p1) { 23090 int32x2_t __ret; 23091 __ret = (int32x2_t) __builtin_neon_vqrdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 23092 return __ret; 23093 } 23094 #else 23095 __ai __attribute__((target("neon"))) int32x2_t vqrdmulh_s32(int32x2_t __p0, int32x2_t __p1) { 23096 int32x2_t __ret; 23097 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23098 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23099 __ret = (int32x2_t) __builtin_neon_vqrdmulh_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 23100 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23101 return __ret; 23102 } 23103 __ai __attribute__((target("neon"))) int32x2_t __noswap_vqrdmulh_s32(int32x2_t __p0, int32x2_t __p1) { 23104 int32x2_t __ret; 23105 __ret = (int32x2_t) __builtin_neon_vqrdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 23106 return __ret; 23107 } 23108 #endif 23109 23110 #ifdef __LITTLE_ENDIAN__ 23111 __ai __attribute__((target("neon"))) int16x4_t vqrdmulh_s16(int16x4_t __p0, int16x4_t __p1) { 23112 int16x4_t __ret; 23113 __ret = (int16x4_t) __builtin_neon_vqrdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 23114 return __ret; 23115 } 23116 #else 23117 __ai __attribute__((target("neon"))) int16x4_t vqrdmulh_s16(int16x4_t __p0, int16x4_t __p1) { 23118 int16x4_t __ret; 23119 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23120 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23121 __ret = (int16x4_t) 
__builtin_neon_vqrdmulh_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 23122 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23123 return __ret; 23124 } 23125 __ai __attribute__((target("neon"))) int16x4_t __noswap_vqrdmulh_s16(int16x4_t __p0, int16x4_t __p1) { 23126 int16x4_t __ret; 23127 __ret = (int16x4_t) __builtin_neon_vqrdmulh_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 23128 return __ret; 23129 } 23130 #endif 23131 23132 #ifdef __LITTLE_ENDIAN__ 23133 __ai __attribute__((target("neon"))) int32x4_t vqrdmulhq_n_s32(int32x4_t __p0, int32_t __p1) { 23134 int32x4_t __ret; 23135 __ret = vqrdmulhq_s32(__p0, (int32x4_t) {__p1, __p1, __p1, __p1}); 23136 return __ret; 23137 } 23138 #else 23139 __ai __attribute__((target("neon"))) int32x4_t vqrdmulhq_n_s32(int32x4_t __p0, int32_t __p1) { 23140 int32x4_t __ret; 23141 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23142 __ret = __noswap_vqrdmulhq_s32(__rev0, (int32x4_t) {__p1, __p1, __p1, __p1}); 23143 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23144 return __ret; 23145 } 23146 #endif 23147 23148 #ifdef __LITTLE_ENDIAN__ 23149 __ai __attribute__((target("neon"))) int16x8_t vqrdmulhq_n_s16(int16x8_t __p0, int16_t __p1) { 23150 int16x8_t __ret; 23151 __ret = vqrdmulhq_s16(__p0, (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1}); 23152 return __ret; 23153 } 23154 #else 23155 __ai __attribute__((target("neon"))) int16x8_t vqrdmulhq_n_s16(int16x8_t __p0, int16_t __p1) { 23156 int16x8_t __ret; 23157 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23158 __ret = __noswap_vqrdmulhq_s16(__rev0, (int16x8_t) {__p1, __p1, __p1, __p1, __p1, __p1, __p1, __p1}); 23159 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23160 return __ret; 23161 } 23162 #endif 23163 23164 #ifdef __LITTLE_ENDIAN__ 23165 __ai __attribute__((target("neon"))) int32x2_t vqrdmulh_n_s32(int32x2_t __p0, int32_t __p1) { 23166 int32x2_t __ret; 23167 
__ret = vqrdmulh_s32(__p0, (int32x2_t) {__p1, __p1}); 23168 return __ret; 23169 } 23170 #else 23171 __ai __attribute__((target("neon"))) int32x2_t vqrdmulh_n_s32(int32x2_t __p0, int32_t __p1) { 23172 int32x2_t __ret; 23173 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23174 __ret = __noswap_vqrdmulh_s32(__rev0, (int32x2_t) {__p1, __p1}); 23175 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23176 return __ret; 23177 } 23178 #endif 23179 23180 #ifdef __LITTLE_ENDIAN__ 23181 __ai __attribute__((target("neon"))) int16x4_t vqrdmulh_n_s16(int16x4_t __p0, int16_t __p1) { 23182 int16x4_t __ret; 23183 __ret = vqrdmulh_s16(__p0, (int16x4_t) {__p1, __p1, __p1, __p1}); 23184 return __ret; 23185 } 23186 #else 23187 __ai __attribute__((target("neon"))) int16x4_t vqrdmulh_n_s16(int16x4_t __p0, int16_t __p1) { 23188 int16x4_t __ret; 23189 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23190 __ret = __noswap_vqrdmulh_s16(__rev0, (int16x4_t) {__p1, __p1, __p1, __p1}); 23191 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23192 return __ret; 23193 } 23194 #endif 23195 23196 #ifdef __LITTLE_ENDIAN__ 23197 __ai __attribute__((target("neon"))) uint8x16_t vqrshlq_u8(uint8x16_t __p0, int8x16_t __p1) { 23198 uint8x16_t __ret; 23199 __ret = (uint8x16_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 23200 return __ret; 23201 } 23202 #else 23203 __ai __attribute__((target("neon"))) uint8x16_t vqrshlq_u8(uint8x16_t __p0, int8x16_t __p1) { 23204 uint8x16_t __ret; 23205 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23206 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23207 __ret = (uint8x16_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 23208 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 
23209 return __ret; 23210 } 23211 #endif 23212 23213 #ifdef __LITTLE_ENDIAN__ 23214 __ai __attribute__((target("neon"))) uint32x4_t vqrshlq_u32(uint32x4_t __p0, int32x4_t __p1) { 23215 uint32x4_t __ret; 23216 __ret = (uint32x4_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 23217 return __ret; 23218 } 23219 #else 23220 __ai __attribute__((target("neon"))) uint32x4_t vqrshlq_u32(uint32x4_t __p0, int32x4_t __p1) { 23221 uint32x4_t __ret; 23222 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23223 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23224 __ret = (uint32x4_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 23225 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23226 return __ret; 23227 } 23228 #endif 23229 23230 #ifdef __LITTLE_ENDIAN__ 23231 __ai __attribute__((target("neon"))) uint64x2_t vqrshlq_u64(uint64x2_t __p0, int64x2_t __p1) { 23232 uint64x2_t __ret; 23233 __ret = (uint64x2_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 23234 return __ret; 23235 } 23236 #else 23237 __ai __attribute__((target("neon"))) uint64x2_t vqrshlq_u64(uint64x2_t __p0, int64x2_t __p1) { 23238 uint64x2_t __ret; 23239 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23240 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23241 __ret = (uint64x2_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 23242 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23243 return __ret; 23244 } 23245 #endif 23246 23247 #ifdef __LITTLE_ENDIAN__ 23248 __ai __attribute__((target("neon"))) uint16x8_t vqrshlq_u16(uint16x8_t __p0, int16x8_t __p1) { 23249 uint16x8_t __ret; 23250 __ret = (uint16x8_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 23251 return __ret; 23252 } 23253 #else 23254 __ai __attribute__((target("neon"))) uint16x8_t vqrshlq_u16(uint16x8_t __p0, int16x8_t __p1) { 23255 
uint16x8_t __ret; 23256 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23257 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 23258 __ret = (uint16x8_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 23259 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23260 return __ret; 23261 } 23262 #endif 23263 23264 #ifdef __LITTLE_ENDIAN__ 23265 __ai __attribute__((target("neon"))) int8x16_t vqrshlq_s8(int8x16_t __p0, int8x16_t __p1) { 23266 int8x16_t __ret; 23267 __ret = (int8x16_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 23268 return __ret; 23269 } 23270 #else 23271 __ai __attribute__((target("neon"))) int8x16_t vqrshlq_s8(int8x16_t __p0, int8x16_t __p1) { 23272 int8x16_t __ret; 23273 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23274 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23275 __ret = (int8x16_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 23276 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23277 return __ret; 23278 } 23279 #endif 23280 23281 #ifdef __LITTLE_ENDIAN__ 23282 __ai __attribute__((target("neon"))) int32x4_t vqrshlq_s32(int32x4_t __p0, int32x4_t __p1) { 23283 int32x4_t __ret; 23284 __ret = (int32x4_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 23285 return __ret; 23286 } 23287 #else 23288 __ai __attribute__((target("neon"))) int32x4_t vqrshlq_s32(int32x4_t __p0, int32x4_t __p1) { 23289 int32x4_t __ret; 23290 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23291 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23292 __ret = (int32x4_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 23293 __ret 
= __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23294 return __ret; 23295 } 23296 #endif 23297 23298 #ifdef __LITTLE_ENDIAN__ 23299 __ai __attribute__((target("neon"))) int64x2_t vqrshlq_s64(int64x2_t __p0, int64x2_t __p1) { 23300 int64x2_t __ret; 23301 __ret = (int64x2_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 23302 return __ret; 23303 } 23304 #else 23305 __ai __attribute__((target("neon"))) int64x2_t vqrshlq_s64(int64x2_t __p0, int64x2_t __p1) { 23306 int64x2_t __ret; 23307 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23308 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23309 __ret = (int64x2_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 23310 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23311 return __ret; 23312 } 23313 #endif 23314 23315 #ifdef __LITTLE_ENDIAN__ 23316 __ai __attribute__((target("neon"))) int16x8_t vqrshlq_s16(int16x8_t __p0, int16x8_t __p1) { 23317 int16x8_t __ret; 23318 __ret = (int16x8_t) __builtin_neon_vqrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 23319 return __ret; 23320 } 23321 #else 23322 __ai __attribute__((target("neon"))) int16x8_t vqrshlq_s16(int16x8_t __p0, int16x8_t __p1) { 23323 int16x8_t __ret; 23324 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23325 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 23326 __ret = (int16x8_t) __builtin_neon_vqrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 23327 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23328 return __ret; 23329 } 23330 #endif 23331 23332 #ifdef __LITTLE_ENDIAN__ 23333 __ai __attribute__((target("neon"))) uint8x8_t vqrshl_u8(uint8x8_t __p0, int8x8_t __p1) { 23334 uint8x8_t __ret; 23335 __ret = (uint8x8_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 23336 return __ret; 23337 } 23338 #else 23339 __ai __attribute__((target("neon"))) uint8x8_t 
vqrshl_u8(uint8x8_t __p0, int8x8_t __p1) { 23340 uint8x8_t __ret; 23341 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23342 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 23343 __ret = (uint8x8_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 23344 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23345 return __ret; 23346 } 23347 #endif 23348 23349 #ifdef __LITTLE_ENDIAN__ 23350 __ai __attribute__((target("neon"))) uint32x2_t vqrshl_u32(uint32x2_t __p0, int32x2_t __p1) { 23351 uint32x2_t __ret; 23352 __ret = (uint32x2_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 23353 return __ret; 23354 } 23355 #else 23356 __ai __attribute__((target("neon"))) uint32x2_t vqrshl_u32(uint32x2_t __p0, int32x2_t __p1) { 23357 uint32x2_t __ret; 23358 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23359 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23360 __ret = (uint32x2_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 23361 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23362 return __ret; 23363 } 23364 #endif 23365 23366 __ai __attribute__((target("neon"))) uint64x1_t vqrshl_u64(uint64x1_t __p0, int64x1_t __p1) { 23367 uint64x1_t __ret; 23368 __ret = (uint64x1_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 23369 return __ret; 23370 } 23371 #ifdef __LITTLE_ENDIAN__ 23372 __ai __attribute__((target("neon"))) uint16x4_t vqrshl_u16(uint16x4_t __p0, int16x4_t __p1) { 23373 uint16x4_t __ret; 23374 __ret = (uint16x4_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 23375 return __ret; 23376 } 23377 #else 23378 __ai __attribute__((target("neon"))) uint16x4_t vqrshl_u16(uint16x4_t __p0, int16x4_t __p1) { 23379 uint16x4_t __ret; 23380 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23381 int16x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23382 __ret = (uint16x4_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 23383 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23384 return __ret; 23385 } 23386 #endif 23387 23388 #ifdef __LITTLE_ENDIAN__ 23389 __ai __attribute__((target("neon"))) int8x8_t vqrshl_s8(int8x8_t __p0, int8x8_t __p1) { 23390 int8x8_t __ret; 23391 __ret = (int8x8_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 23392 return __ret; 23393 } 23394 #else 23395 __ai __attribute__((target("neon"))) int8x8_t vqrshl_s8(int8x8_t __p0, int8x8_t __p1) { 23396 int8x8_t __ret; 23397 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23398 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 23399 __ret = (int8x8_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 23400 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23401 return __ret; 23402 } 23403 #endif 23404 23405 #ifdef __LITTLE_ENDIAN__ 23406 __ai __attribute__((target("neon"))) int32x2_t vqrshl_s32(int32x2_t __p0, int32x2_t __p1) { 23407 int32x2_t __ret; 23408 __ret = (int32x2_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 23409 return __ret; 23410 } 23411 #else 23412 __ai __attribute__((target("neon"))) int32x2_t vqrshl_s32(int32x2_t __p0, int32x2_t __p1) { 23413 int32x2_t __ret; 23414 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23415 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23416 __ret = (int32x2_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 23417 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23418 return __ret; 23419 } 23420 #endif 23421 23422 __ai __attribute__((target("neon"))) int64x1_t vqrshl_s64(int64x1_t __p0, int64x1_t __p1) { 23423 int64x1_t __ret; 23424 __ret = (int64x1_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 3); 23425 
return __ret; 23426 } 23427 #ifdef __LITTLE_ENDIAN__ 23428 __ai __attribute__((target("neon"))) int16x4_t vqrshl_s16(int16x4_t __p0, int16x4_t __p1) { 23429 int16x4_t __ret; 23430 __ret = (int16x4_t) __builtin_neon_vqrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 23431 return __ret; 23432 } 23433 #else 23434 __ai __attribute__((target("neon"))) int16x4_t vqrshl_s16(int16x4_t __p0, int16x4_t __p1) { 23435 int16x4_t __ret; 23436 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23437 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23438 __ret = (int16x4_t) __builtin_neon_vqrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 23439 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23440 return __ret; 23441 } 23442 #endif 23443 23444 #ifdef __LITTLE_ENDIAN__ 23445 #define vqrshrn_n_u32(__p0, __p1) __extension__ ({ \ 23446 uint16x4_t __ret; \ 23447 uint32x4_t __s0 = __p0; \ 23448 __ret = (uint16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 17); \ 23449 __ret; \ 23450 }) 23451 #else 23452 #define vqrshrn_n_u32(__p0, __p1) __extension__ ({ \ 23453 uint16x4_t __ret; \ 23454 uint32x4_t __s0 = __p0; \ 23455 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 23456 __ret = (uint16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 17); \ 23457 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 23458 __ret; \ 23459 }) 23460 #define __noswap_vqrshrn_n_u32(__p0, __p1) __extension__ ({ \ 23461 uint16x4_t __ret; \ 23462 uint32x4_t __s0 = __p0; \ 23463 __ret = (uint16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 17); \ 23464 __ret; \ 23465 }) 23466 #endif 23467 23468 #ifdef __LITTLE_ENDIAN__ 23469 #define vqrshrn_n_u64(__p0, __p1) __extension__ ({ \ 23470 uint32x2_t __ret; \ 23471 uint64x2_t __s0 = __p0; \ 23472 __ret = (uint32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 18); \ 23473 __ret; \ 23474 }) 23475 #else 23476 #define vqrshrn_n_u64(__p0, __p1) 
__extension__ ({ \ 23477 uint32x2_t __ret; \ 23478 uint64x2_t __s0 = __p0; \ 23479 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 23480 __ret = (uint32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 18); \ 23481 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 23482 __ret; \ 23483 }) 23484 #define __noswap_vqrshrn_n_u64(__p0, __p1) __extension__ ({ \ 23485 uint32x2_t __ret; \ 23486 uint64x2_t __s0 = __p0; \ 23487 __ret = (uint32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 18); \ 23488 __ret; \ 23489 }) 23490 #endif 23491 23492 #ifdef __LITTLE_ENDIAN__ 23493 #define vqrshrn_n_u16(__p0, __p1) __extension__ ({ \ 23494 uint8x8_t __ret; \ 23495 uint16x8_t __s0 = __p0; \ 23496 __ret = (uint8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 16); \ 23497 __ret; \ 23498 }) 23499 #else 23500 #define vqrshrn_n_u16(__p0, __p1) __extension__ ({ \ 23501 uint8x8_t __ret; \ 23502 uint16x8_t __s0 = __p0; \ 23503 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 23504 __ret = (uint8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 16); \ 23505 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 23506 __ret; \ 23507 }) 23508 #define __noswap_vqrshrn_n_u16(__p0, __p1) __extension__ ({ \ 23509 uint8x8_t __ret; \ 23510 uint16x8_t __s0 = __p0; \ 23511 __ret = (uint8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 16); \ 23512 __ret; \ 23513 }) 23514 #endif 23515 23516 #ifdef __LITTLE_ENDIAN__ 23517 #define vqrshrn_n_s32(__p0, __p1) __extension__ ({ \ 23518 int16x4_t __ret; \ 23519 int32x4_t __s0 = __p0; \ 23520 __ret = (int16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 1); \ 23521 __ret; \ 23522 }) 23523 #else 23524 #define vqrshrn_n_s32(__p0, __p1) __extension__ ({ \ 23525 int16x4_t __ret; \ 23526 int32x4_t __s0 = __p0; \ 23527 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 23528 __ret = (int16x4_t) 
__builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 1); \ 23529 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 23530 __ret; \ 23531 }) 23532 #define __noswap_vqrshrn_n_s32(__p0, __p1) __extension__ ({ \ 23533 int16x4_t __ret; \ 23534 int32x4_t __s0 = __p0; \ 23535 __ret = (int16x4_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 1); \ 23536 __ret; \ 23537 }) 23538 #endif 23539 23540 #ifdef __LITTLE_ENDIAN__ 23541 #define vqrshrn_n_s64(__p0, __p1) __extension__ ({ \ 23542 int32x2_t __ret; \ 23543 int64x2_t __s0 = __p0; \ 23544 __ret = (int32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 2); \ 23545 __ret; \ 23546 }) 23547 #else 23548 #define vqrshrn_n_s64(__p0, __p1) __extension__ ({ \ 23549 int32x2_t __ret; \ 23550 int64x2_t __s0 = __p0; \ 23551 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 23552 __ret = (int32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 2); \ 23553 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 23554 __ret; \ 23555 }) 23556 #define __noswap_vqrshrn_n_s64(__p0, __p1) __extension__ ({ \ 23557 int32x2_t __ret; \ 23558 int64x2_t __s0 = __p0; \ 23559 __ret = (int32x2_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 2); \ 23560 __ret; \ 23561 }) 23562 #endif 23563 23564 #ifdef __LITTLE_ENDIAN__ 23565 #define vqrshrn_n_s16(__p0, __p1) __extension__ ({ \ 23566 int8x8_t __ret; \ 23567 int16x8_t __s0 = __p0; \ 23568 __ret = (int8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 0); \ 23569 __ret; \ 23570 }) 23571 #else 23572 #define vqrshrn_n_s16(__p0, __p1) __extension__ ({ \ 23573 int8x8_t __ret; \ 23574 int16x8_t __s0 = __p0; \ 23575 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 23576 __ret = (int8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__rev0, __p1, 0); \ 23577 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 23578 __ret; \ 23579 }) 23580 #define __noswap_vqrshrn_n_s16(__p0, __p1) __extension__ ({ \ 
23581 int8x8_t __ret; \ 23582 int16x8_t __s0 = __p0; \ 23583 __ret = (int8x8_t) __builtin_neon_vqrshrn_n_v((int8x16_t)__s0, __p1, 0); \ 23584 __ret; \ 23585 }) 23586 #endif 23587 23588 #ifdef __LITTLE_ENDIAN__ 23589 #define vqrshrun_n_s32(__p0, __p1) __extension__ ({ \ 23590 uint16x4_t __ret; \ 23591 int32x4_t __s0 = __p0; \ 23592 __ret = (uint16x4_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 17); \ 23593 __ret; \ 23594 }) 23595 #else 23596 #define vqrshrun_n_s32(__p0, __p1) __extension__ ({ \ 23597 uint16x4_t __ret; \ 23598 int32x4_t __s0 = __p0; \ 23599 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 23600 __ret = (uint16x4_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__rev0, __p1, 17); \ 23601 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 23602 __ret; \ 23603 }) 23604 #define __noswap_vqrshrun_n_s32(__p0, __p1) __extension__ ({ \ 23605 uint16x4_t __ret; \ 23606 int32x4_t __s0 = __p0; \ 23607 __ret = (uint16x4_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 17); \ 23608 __ret; \ 23609 }) 23610 #endif 23611 23612 #ifdef __LITTLE_ENDIAN__ 23613 #define vqrshrun_n_s64(__p0, __p1) __extension__ ({ \ 23614 uint32x2_t __ret; \ 23615 int64x2_t __s0 = __p0; \ 23616 __ret = (uint32x2_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 18); \ 23617 __ret; \ 23618 }) 23619 #else 23620 #define vqrshrun_n_s64(__p0, __p1) __extension__ ({ \ 23621 uint32x2_t __ret; \ 23622 int64x2_t __s0 = __p0; \ 23623 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 23624 __ret = (uint32x2_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__rev0, __p1, 18); \ 23625 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 23626 __ret; \ 23627 }) 23628 #define __noswap_vqrshrun_n_s64(__p0, __p1) __extension__ ({ \ 23629 uint32x2_t __ret; \ 23630 int64x2_t __s0 = __p0; \ 23631 __ret = (uint32x2_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 18); \ 23632 __ret; \ 23633 }) 23634 #endif 23635 23636 #ifdef 
__LITTLE_ENDIAN__ 23637 #define vqrshrun_n_s16(__p0, __p1) __extension__ ({ \ 23638 uint8x8_t __ret; \ 23639 int16x8_t __s0 = __p0; \ 23640 __ret = (uint8x8_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 16); \ 23641 __ret; \ 23642 }) 23643 #else 23644 #define vqrshrun_n_s16(__p0, __p1) __extension__ ({ \ 23645 uint8x8_t __ret; \ 23646 int16x8_t __s0 = __p0; \ 23647 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 23648 __ret = (uint8x8_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__rev0, __p1, 16); \ 23649 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 23650 __ret; \ 23651 }) 23652 #define __noswap_vqrshrun_n_s16(__p0, __p1) __extension__ ({ \ 23653 uint8x8_t __ret; \ 23654 int16x8_t __s0 = __p0; \ 23655 __ret = (uint8x8_t) __builtin_neon_vqrshrun_n_v((int8x16_t)__s0, __p1, 16); \ 23656 __ret; \ 23657 }) 23658 #endif 23659 23660 #ifdef __LITTLE_ENDIAN__ 23661 __ai __attribute__((target("neon"))) uint8x16_t vqshlq_u8(uint8x16_t __p0, int8x16_t __p1) { 23662 uint8x16_t __ret; 23663 __ret = (uint8x16_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 23664 return __ret; 23665 } 23666 #else 23667 __ai __attribute__((target("neon"))) uint8x16_t vqshlq_u8(uint8x16_t __p0, int8x16_t __p1) { 23668 uint8x16_t __ret; 23669 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23670 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23671 __ret = (uint8x16_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 23672 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23673 return __ret; 23674 } 23675 #endif 23676 23677 #ifdef __LITTLE_ENDIAN__ 23678 __ai __attribute__((target("neon"))) uint32x4_t vqshlq_u32(uint32x4_t __p0, int32x4_t __p1) { 23679 uint32x4_t __ret; 23680 __ret = (uint32x4_t) 
__builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 23681 return __ret; 23682 } 23683 #else 23684 __ai __attribute__((target("neon"))) uint32x4_t vqshlq_u32(uint32x4_t __p0, int32x4_t __p1) { 23685 uint32x4_t __ret; 23686 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23687 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23688 __ret = (uint32x4_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 23689 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23690 return __ret; 23691 } 23692 #endif 23693 23694 #ifdef __LITTLE_ENDIAN__ 23695 __ai __attribute__((target("neon"))) uint64x2_t vqshlq_u64(uint64x2_t __p0, int64x2_t __p1) { 23696 uint64x2_t __ret; 23697 __ret = (uint64x2_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 23698 return __ret; 23699 } 23700 #else 23701 __ai __attribute__((target("neon"))) uint64x2_t vqshlq_u64(uint64x2_t __p0, int64x2_t __p1) { 23702 uint64x2_t __ret; 23703 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23704 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23705 __ret = (uint64x2_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 23706 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23707 return __ret; 23708 } 23709 #endif 23710 23711 #ifdef __LITTLE_ENDIAN__ 23712 __ai __attribute__((target("neon"))) uint16x8_t vqshlq_u16(uint16x8_t __p0, int16x8_t __p1) { 23713 uint16x8_t __ret; 23714 __ret = (uint16x8_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 23715 return __ret; 23716 } 23717 #else 23718 __ai __attribute__((target("neon"))) uint16x8_t vqshlq_u16(uint16x8_t __p0, int16x8_t __p1) { 23719 uint16x8_t __ret; 23720 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23721 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 23722 __ret = (uint16x8_t) 
__builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 23723 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23724 return __ret; 23725 } 23726 #endif 23727 23728 #ifdef __LITTLE_ENDIAN__ 23729 __ai __attribute__((target("neon"))) int8x16_t vqshlq_s8(int8x16_t __p0, int8x16_t __p1) { 23730 int8x16_t __ret; 23731 __ret = (int8x16_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 23732 return __ret; 23733 } 23734 #else 23735 __ai __attribute__((target("neon"))) int8x16_t vqshlq_s8(int8x16_t __p0, int8x16_t __p1) { 23736 int8x16_t __ret; 23737 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23738 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23739 __ret = (int8x16_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 23740 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 23741 return __ret; 23742 } 23743 #endif 23744 23745 #ifdef __LITTLE_ENDIAN__ 23746 __ai __attribute__((target("neon"))) int32x4_t vqshlq_s32(int32x4_t __p0, int32x4_t __p1) { 23747 int32x4_t __ret; 23748 __ret = (int32x4_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 23749 return __ret; 23750 } 23751 #else 23752 __ai __attribute__((target("neon"))) int32x4_t vqshlq_s32(int32x4_t __p0, int32x4_t __p1) { 23753 int32x4_t __ret; 23754 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23755 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23756 __ret = (int32x4_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 23757 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23758 return __ret; 23759 } 23760 #endif 23761 23762 #ifdef __LITTLE_ENDIAN__ 23763 __ai __attribute__((target("neon"))) int64x2_t vqshlq_s64(int64x2_t __p0, int64x2_t __p1) { 23764 
int64x2_t __ret; 23765 __ret = (int64x2_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 23766 return __ret; 23767 } 23768 #else 23769 __ai __attribute__((target("neon"))) int64x2_t vqshlq_s64(int64x2_t __p0, int64x2_t __p1) { 23770 int64x2_t __ret; 23771 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23772 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23773 __ret = (int64x2_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 23774 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23775 return __ret; 23776 } 23777 #endif 23778 23779 #ifdef __LITTLE_ENDIAN__ 23780 __ai __attribute__((target("neon"))) int16x8_t vqshlq_s16(int16x8_t __p0, int16x8_t __p1) { 23781 int16x8_t __ret; 23782 __ret = (int16x8_t) __builtin_neon_vqshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 23783 return __ret; 23784 } 23785 #else 23786 __ai __attribute__((target("neon"))) int16x8_t vqshlq_s16(int16x8_t __p0, int16x8_t __p1) { 23787 int16x8_t __ret; 23788 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23789 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 23790 __ret = (int16x8_t) __builtin_neon_vqshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 23791 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23792 return __ret; 23793 } 23794 #endif 23795 23796 #ifdef __LITTLE_ENDIAN__ 23797 __ai __attribute__((target("neon"))) uint8x8_t vqshl_u8(uint8x8_t __p0, int8x8_t __p1) { 23798 uint8x8_t __ret; 23799 __ret = (uint8x8_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 23800 return __ret; 23801 } 23802 #else 23803 __ai __attribute__((target("neon"))) uint8x8_t vqshl_u8(uint8x8_t __p0, int8x8_t __p1) { 23804 uint8x8_t __ret; 23805 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23806 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 
1, 0); 23807 __ret = (uint8x8_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 23808 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23809 return __ret; 23810 } 23811 #endif 23812 23813 #ifdef __LITTLE_ENDIAN__ 23814 __ai __attribute__((target("neon"))) uint32x2_t vqshl_u32(uint32x2_t __p0, int32x2_t __p1) { 23815 uint32x2_t __ret; 23816 __ret = (uint32x2_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 23817 return __ret; 23818 } 23819 #else 23820 __ai __attribute__((target("neon"))) uint32x2_t vqshl_u32(uint32x2_t __p0, int32x2_t __p1) { 23821 uint32x2_t __ret; 23822 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23823 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23824 __ret = (uint32x2_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 23825 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23826 return __ret; 23827 } 23828 #endif 23829 23830 __ai __attribute__((target("neon"))) uint64x1_t vqshl_u64(uint64x1_t __p0, int64x1_t __p1) { 23831 uint64x1_t __ret; 23832 __ret = (uint64x1_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 23833 return __ret; 23834 } 23835 #ifdef __LITTLE_ENDIAN__ 23836 __ai __attribute__((target("neon"))) uint16x4_t vqshl_u16(uint16x4_t __p0, int16x4_t __p1) { 23837 uint16x4_t __ret; 23838 __ret = (uint16x4_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 23839 return __ret; 23840 } 23841 #else 23842 __ai __attribute__((target("neon"))) uint16x4_t vqshl_u16(uint16x4_t __p0, int16x4_t __p1) { 23843 uint16x4_t __ret; 23844 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23845 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23846 __ret = (uint16x4_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 23847 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23848 return __ret; 23849 } 23850 #endif 23851 23852 #ifdef 
__LITTLE_ENDIAN__ 23853 __ai __attribute__((target("neon"))) int8x8_t vqshl_s8(int8x8_t __p0, int8x8_t __p1) { 23854 int8x8_t __ret; 23855 __ret = (int8x8_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 23856 return __ret; 23857 } 23858 #else 23859 __ai __attribute__((target("neon"))) int8x8_t vqshl_s8(int8x8_t __p0, int8x8_t __p1) { 23860 int8x8_t __ret; 23861 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 23862 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 23863 __ret = (int8x8_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 23864 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 23865 return __ret; 23866 } 23867 #endif 23868 23869 #ifdef __LITTLE_ENDIAN__ 23870 __ai __attribute__((target("neon"))) int32x2_t vqshl_s32(int32x2_t __p0, int32x2_t __p1) { 23871 int32x2_t __ret; 23872 __ret = (int32x2_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 23873 return __ret; 23874 } 23875 #else 23876 __ai __attribute__((target("neon"))) int32x2_t vqshl_s32(int32x2_t __p0, int32x2_t __p1) { 23877 int32x2_t __ret; 23878 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 23879 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 23880 __ret = (int32x2_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 23881 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 23882 return __ret; 23883 } 23884 #endif 23885 23886 __ai __attribute__((target("neon"))) int64x1_t vqshl_s64(int64x1_t __p0, int64x1_t __p1) { 23887 int64x1_t __ret; 23888 __ret = (int64x1_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 3); 23889 return __ret; 23890 } 23891 #ifdef __LITTLE_ENDIAN__ 23892 __ai __attribute__((target("neon"))) int16x4_t vqshl_s16(int16x4_t __p0, int16x4_t __p1) { 23893 int16x4_t __ret; 23894 __ret = (int16x4_t) __builtin_neon_vqshl_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 23895 return 
__ret; 23896 } 23897 #else 23898 __ai __attribute__((target("neon"))) int16x4_t vqshl_s16(int16x4_t __p0, int16x4_t __p1) { 23899 int16x4_t __ret; 23900 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 23901 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 23902 __ret = (int16x4_t) __builtin_neon_vqshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 23903 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 23904 return __ret; 23905 } 23906 #endif 23907 23908 #ifdef __LITTLE_ENDIAN__ 23909 #define vqshlq_n_u8(__p0, __p1) __extension__ ({ \ 23910 uint8x16_t __ret; \ 23911 uint8x16_t __s0 = __p0; \ 23912 __ret = (uint8x16_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 48); \ 23913 __ret; \ 23914 }) 23915 #else 23916 #define vqshlq_n_u8(__p0, __p1) __extension__ ({ \ 23917 uint8x16_t __ret; \ 23918 uint8x16_t __s0 = __p0; \ 23919 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 23920 __ret = (uint8x16_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 48); \ 23921 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 23922 __ret; \ 23923 }) 23924 #endif 23925 23926 #ifdef __LITTLE_ENDIAN__ 23927 #define vqshlq_n_u32(__p0, __p1) __extension__ ({ \ 23928 uint32x4_t __ret; \ 23929 uint32x4_t __s0 = __p0; \ 23930 __ret = (uint32x4_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 50); \ 23931 __ret; \ 23932 }) 23933 #else 23934 #define vqshlq_n_u32(__p0, __p1) __extension__ ({ \ 23935 uint32x4_t __ret; \ 23936 uint32x4_t __s0 = __p0; \ 23937 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 23938 __ret = (uint32x4_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 50); \ 23939 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 23940 __ret; \ 23941 }) 23942 #endif 23943 23944 #ifdef __LITTLE_ENDIAN__ 23945 #define vqshlq_n_u64(__p0, __p1) 
__extension__ ({ \ 23946 uint64x2_t __ret; \ 23947 uint64x2_t __s0 = __p0; \ 23948 __ret = (uint64x2_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 51); \ 23949 __ret; \ 23950 }) 23951 #else 23952 #define vqshlq_n_u64(__p0, __p1) __extension__ ({ \ 23953 uint64x2_t __ret; \ 23954 uint64x2_t __s0 = __p0; \ 23955 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 23956 __ret = (uint64x2_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 51); \ 23957 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 23958 __ret; \ 23959 }) 23960 #endif 23961 23962 #ifdef __LITTLE_ENDIAN__ 23963 #define vqshlq_n_u16(__p0, __p1) __extension__ ({ \ 23964 uint16x8_t __ret; \ 23965 uint16x8_t __s0 = __p0; \ 23966 __ret = (uint16x8_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 49); \ 23967 __ret; \ 23968 }) 23969 #else 23970 #define vqshlq_n_u16(__p0, __p1) __extension__ ({ \ 23971 uint16x8_t __ret; \ 23972 uint16x8_t __s0 = __p0; \ 23973 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 23974 __ret = (uint16x8_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 49); \ 23975 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 23976 __ret; \ 23977 }) 23978 #endif 23979 23980 #ifdef __LITTLE_ENDIAN__ 23981 #define vqshlq_n_s8(__p0, __p1) __extension__ ({ \ 23982 int8x16_t __ret; \ 23983 int8x16_t __s0 = __p0; \ 23984 __ret = (int8x16_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 32); \ 23985 __ret; \ 23986 }) 23987 #else 23988 #define vqshlq_n_s8(__p0, __p1) __extension__ ({ \ 23989 int8x16_t __ret; \ 23990 int8x16_t __s0 = __p0; \ 23991 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 23992 __ret = (int8x16_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 32); \ 23993 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 23994 __ret; \ 23995 }) 23996 #endif 

/*
 * vqshlq_n_{s32,s64,s16}
 *
 * Statement-expression macros forwarding a 128-bit signed vector and __p1 to
 * __builtin_neon_vqshlq_n_v with type codes 34 (s32), 35 (s64) and 33 (s16).
 * When __LITTLE_ENDIAN__ is not defined the operand is lane-reversed before
 * the call and the result lane-reversed after it.
 * NOTE(review): per ACLE naming this is "saturating shift left by immediate"
 * -- confirm against the ACLE intrinsics reference.
 */
#ifdef __LITTLE_ENDIAN__
#define vqshlq_n_s32(__p0, __p1) __extension__ ({ \
  int32x4_t __ret; \
  int32x4_t __s0 = __p0; \
  __ret = (int32x4_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 34); \
  __ret; \
})
#else
#define vqshlq_n_s32(__p0, __p1) __extension__ ({ \
  int32x4_t __ret; \
  int32x4_t __s0 = __p0; \
  int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  __ret = (int32x4_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 34); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshlq_n_s64(__p0, __p1) __extension__ ({ \
  int64x2_t __ret; \
  int64x2_t __s0 = __p0; \
  __ret = (int64x2_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 35); \
  __ret; \
})
#else
#define vqshlq_n_s64(__p0, __p1) __extension__ ({ \
  int64x2_t __ret; \
  int64x2_t __s0 = __p0; \
  int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  __ret = (int64x2_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 35); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshlq_n_s16(__p0, __p1) __extension__ ({ \
  int16x8_t __ret; \
  int16x8_t __s0 = __p0; \
  __ret = (int16x8_t) __builtin_neon_vqshlq_n_v((int8x16_t)__s0, __p1, 33); \
  __ret; \
})
#else
#define vqshlq_n_s16(__p0, __p1) __extension__ ({ \
  int16x8_t __ret; \
  int16x8_t __s0 = __p0; \
  int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret = (int16x8_t) __builtin_neon_vqshlq_n_v((int8x16_t)__rev0, __p1, 33); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/*
 * vqshl_n_{u8,u32,u64,u16,s8,s32,s64,s16}
 *
 * 64-bit counterparts of vqshlq_n_*, calling __builtin_neon_vqshl_n_v with
 * type codes 16..19 (unsigned) and 0..3 (signed).  The one-lane u64/s64
 * macros have a single definition; the others are lane-reversed around the
 * call when __LITTLE_ENDIAN__ is not defined.
 */
#ifdef __LITTLE_ENDIAN__
#define vqshl_n_u8(__p0, __p1) __extension__ ({ \
  uint8x8_t __ret; \
  uint8x8_t __s0 = __p0; \
  __ret = (uint8x8_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 16); \
  __ret; \
})
#else
#define vqshl_n_u8(__p0, __p1) __extension__ ({ \
  uint8x8_t __ret; \
  uint8x8_t __s0 = __p0; \
  uint8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret = (uint8x8_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 16); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshl_n_u32(__p0, __p1) __extension__ ({ \
  uint32x2_t __ret; \
  uint32x2_t __s0 = __p0; \
  __ret = (uint32x2_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 18); \
  __ret; \
})
#else
#define vqshl_n_u32(__p0, __p1) __extension__ ({ \
  uint32x2_t __ret; \
  uint32x2_t __s0 = __p0; \
  uint32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  __ret = (uint32x2_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 18); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#define vqshl_n_u64(__p0, __p1) __extension__ ({ \
  uint64x1_t __ret; \
  uint64x1_t __s0 = __p0; \
  __ret = (uint64x1_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 19); \
  __ret; \
})
#ifdef __LITTLE_ENDIAN__
#define vqshl_n_u16(__p0, __p1) __extension__ ({ \
  uint16x4_t __ret; \
  uint16x4_t __s0 = __p0; \
  __ret = (uint16x4_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 17); \
  __ret; \
})
#else
#define vqshl_n_u16(__p0, __p1) __extension__ ({ \
  uint16x4_t __ret; \
  uint16x4_t __s0 = __p0; \
  uint16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  __ret = (uint16x4_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 17); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshl_n_s8(__p0, __p1) __extension__ ({ \
  int8x8_t __ret; \
  int8x8_t __s0 = __p0; \
  __ret = (int8x8_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 0); \
  __ret; \
})
#else
#define vqshl_n_s8(__p0, __p1) __extension__ ({ \
  int8x8_t __ret; \
  int8x8_t __s0 = __p0; \
  int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret = (int8x8_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 0); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshl_n_s32(__p0, __p1) __extension__ ({ \
  int32x2_t __ret; \
  int32x2_t __s0 = __p0; \
  __ret = (int32x2_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 2); \
  __ret; \
})
#else
#define vqshl_n_s32(__p0, __p1) __extension__ ({ \
  int32x2_t __ret; \
  int32x2_t __s0 = __p0; \
  int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  __ret = (int32x2_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 2); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#define vqshl_n_s64(__p0, __p1) __extension__ ({ \
  int64x1_t __ret; \
  int64x1_t __s0 = __p0; \
  __ret = (int64x1_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 3); \
  __ret; \
})
#ifdef __LITTLE_ENDIAN__
#define vqshl_n_s16(__p0, __p1) __extension__ ({ \
  int16x4_t __ret; \
  int16x4_t __s0 = __p0; \
  __ret = (int16x4_t) __builtin_neon_vqshl_n_v((int8x8_t)__s0, __p1, 1); \
  __ret; \
})
#else
#define vqshl_n_s16(__p0, __p1) __extension__ ({ \
  int16x4_t __ret; \
  int16x4_t __s0 = __p0; \
  int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  __ret = (int16x4_t) __builtin_neon_vqshl_n_v((int8x8_t)__rev0, __p1, 1); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

/*
 * vqshluq_n_{s8,s32,s64,s16}
 *
 * Macros forwarding a 128-bit signed vector and __p1 to
 * __builtin_neon_vqshluq_n_v.  The result is the unsigned vector of the same
 * lane width (e.g. int8x16_t -> uint8x16_t), so the unsigned type codes
 * 48..51 are passed.  Lane-reversed around the call when __LITTLE_ENDIAN__
 * is not defined.
 */
#ifdef __LITTLE_ENDIAN__
#define vqshluq_n_s8(__p0, __p1) __extension__ ({ \
  uint8x16_t __ret; \
  int8x16_t __s0 = __p0; \
  __ret = (uint8x16_t) __builtin_neon_vqshluq_n_v((int8x16_t)__s0, __p1, 48); \
  __ret; \
})
#else
#define vqshluq_n_s8(__p0, __p1) __extension__ ({ \
  uint8x16_t __ret; \
  int8x16_t __s0 = __p0; \
  int8x16_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret = (uint8x16_t) __builtin_neon_vqshluq_n_v((int8x16_t)__rev0, __p1, 48); \
  __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshluq_n_s32(__p0, __p1) __extension__ ({ \
  uint32x4_t __ret; \
  int32x4_t __s0 = __p0; \
  __ret = (uint32x4_t) __builtin_neon_vqshluq_n_v((int8x16_t)__s0, __p1, 50); \
  __ret; \
})
#else
#define vqshluq_n_s32(__p0, __p1) __extension__ ({ \
  uint32x4_t __ret; \
  int32x4_t __s0 = __p0; \
  int32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  __ret = (uint32x4_t) __builtin_neon_vqshluq_n_v((int8x16_t)__rev0, __p1, 50); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshluq_n_s64(__p0, __p1) __extension__ ({ \
  uint64x2_t __ret; \
  int64x2_t __s0 = __p0; \
  __ret = (uint64x2_t) __builtin_neon_vqshluq_n_v((int8x16_t)__s0, __p1, 51); \
  __ret; \
})
#else
#define vqshluq_n_s64(__p0, __p1) __extension__ ({ \
  uint64x2_t __ret; \
  int64x2_t __s0 = __p0; \
  int64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  __ret = (uint64x2_t) __builtin_neon_vqshluq_n_v((int8x16_t)__rev0, __p1, 51); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshluq_n_s16(__p0, __p1) __extension__ ({ \
  uint16x8_t __ret; \
  int16x8_t __s0 = __p0; \
  __ret = (uint16x8_t) __builtin_neon_vqshluq_n_v((int8x16_t)__s0, __p1, 49); \
  __ret; \
})
#else
#define vqshluq_n_s16(__p0, __p1) __extension__ ({ \
  uint16x8_t __ret; \
  int16x8_t __s0 = __p0; \
  int16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret = (uint16x8_t) __builtin_neon_vqshluq_n_v((int8x16_t)__rev0, __p1, 49); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/*
 * vqshlu_n_{s8,s32,s64,s16}
 *
 * 64-bit counterparts of vqshluq_n_*, calling __builtin_neon_vqshlu_n_v with
 * the unsigned type codes 16..19.  The one-lane s64 macro has a single
 * definition shared by both byte orders.
 */
#ifdef __LITTLE_ENDIAN__
#define vqshlu_n_s8(__p0, __p1) __extension__ ({ \
  uint8x8_t __ret; \
  int8x8_t __s0 = __p0; \
  __ret = (uint8x8_t) __builtin_neon_vqshlu_n_v((int8x8_t)__s0, __p1, 16); \
  __ret; \
})
#else
#define vqshlu_n_s8(__p0, __p1) __extension__ ({ \
  uint8x8_t __ret; \
  int8x8_t __s0 = __p0; \
  int8x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret = (uint8x8_t) __builtin_neon_vqshlu_n_v((int8x8_t)__rev0, __p1, 16); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshlu_n_s32(__p0, __p1) __extension__ ({ \
  uint32x2_t __ret; \
  int32x2_t __s0 = __p0; \
  __ret = (uint32x2_t) __builtin_neon_vqshlu_n_v((int8x8_t)__s0, __p1, 18); \
  __ret; \
})
#else
#define vqshlu_n_s32(__p0, __p1) __extension__ ({ \
  uint32x2_t __ret; \
  int32x2_t __s0 = __p0; \
  int32x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  __ret = (uint32x2_t) __builtin_neon_vqshlu_n_v((int8x8_t)__rev0, __p1, 18); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

#define vqshlu_n_s64(__p0, __p1) __extension__ ({ \
  uint64x1_t __ret; \
  int64x1_t __s0 = __p0; \
  __ret = (uint64x1_t) __builtin_neon_vqshlu_n_v((int8x8_t)__s0, __p1, 19); \
  __ret; \
})
#ifdef __LITTLE_ENDIAN__
#define vqshlu_n_s16(__p0, __p1) __extension__ ({ \
  uint16x4_t __ret; \
  int16x4_t __s0 = __p0; \
  __ret = (uint16x4_t) __builtin_neon_vqshlu_n_v((int8x8_t)__s0, __p1, 17); \
  __ret; \
})
#else
#define vqshlu_n_s16(__p0, __p1) __extension__ ({ \
  uint16x4_t __ret; \
  int16x4_t __s0 = __p0; \
  int16x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  __ret = (uint16x4_t) __builtin_neon_vqshlu_n_v((int8x8_t)__rev0, __p1, 17); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#endif

/*
 * vqshrn_n_{u32,u64,u16}
 *
 * Macros forwarding a 128-bit unsigned vector and __p1 to
 * __builtin_neon_vqshrn_n_v; the result is a 64-bit vector with half-width
 * elements (e.g. uint32x4_t -> uint16x4_t) and the result's type code
 * (17, 18, 16) is passed.  The non-little-endian branch lane-reverses operand
 * and result and additionally defines a __noswap_ form with no reversal.
 * NOTE(review): the __noswap_ forms are presumably for callers that already
 * hold lane-reversed data -- confirm against their users elsewhere in the file.
 */
#ifdef __LITTLE_ENDIAN__
#define vqshrn_n_u32(__p0, __p1) __extension__ ({ \
  uint16x4_t __ret; \
  uint32x4_t __s0 = __p0; \
  __ret = (uint16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 17); \
  __ret; \
})
#else
#define vqshrn_n_u32(__p0, __p1) __extension__ ({ \
  uint16x4_t __ret; \
  uint32x4_t __s0 = __p0; \
  uint32x4_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  __ret = (uint16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 17); \
  __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \
  __ret; \
})
#define __noswap_vqshrn_n_u32(__p0, __p1) __extension__ ({ \
  uint16x4_t __ret; \
  uint32x4_t __s0 = __p0; \
  __ret = (uint16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 17); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshrn_n_u64(__p0, __p1) __extension__ ({ \
  uint32x2_t __ret; \
  uint64x2_t __s0 = __p0; \
  __ret = (uint32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 18); \
  __ret; \
})
#else
#define vqshrn_n_u64(__p0, __p1) __extension__ ({ \
  uint32x2_t __ret; \
  uint64x2_t __s0 = __p0; \
  uint64x2_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  __ret = (uint32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 18); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#define __noswap_vqshrn_n_u64(__p0, __p1) __extension__ ({ \
  uint32x2_t __ret; \
  uint64x2_t __s0 = __p0; \
  __ret = (uint32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 18); \
  __ret; \
})
#endif

#ifdef __LITTLE_ENDIAN__
#define vqshrn_n_u16(__p0, __p1) __extension__ ({ \
  uint8x8_t __ret; \
  uint16x8_t __s0 = __p0; \
  __ret = (uint8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 16); \
  __ret; \
})
#else
#define vqshrn_n_u16(__p0, __p1) __extension__ ({ \
  uint8x8_t __ret; \
  uint16x8_t __s0 = __p0; \
  uint16x8_t __rev0;  __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret = (uint8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 16); \
  __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#define __noswap_vqshrn_n_u16(__p0, __p1) __extension__ ({ \
  uint8x8_t __ret; \
  uint16x8_t __s0 = __p0; \
  __ret = (uint8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 16); \
  __ret; \
})
#endif

24376 #ifdef __LITTLE_ENDIAN__ 24377 #define vqshrn_n_s32(__p0, __p1) __extension__ ({ \ 24378 int16x4_t __ret; \ 24379 int32x4_t __s0 = __p0; \ 24380 __ret = (int16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 1); \ 24381 __ret; \ 24382 }) 24383 #else 24384 #define vqshrn_n_s32(__p0, __p1) __extension__ ({ \ 24385 int16x4_t __ret; \ 24386 int32x4_t __s0 = __p0; \ 24387 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 24388 __ret = (int16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 1); \ 24389 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 24390 __ret; \ 24391 }) 24392 #define __noswap_vqshrn_n_s32(__p0, __p1) __extension__ ({ \ 24393 int16x4_t __ret; \ 24394 int32x4_t __s0 = __p0; \ 24395 __ret = (int16x4_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 1); \ 24396 __ret; \ 24397 }) 24398 #endif 24399 24400 #ifdef __LITTLE_ENDIAN__ 24401 #define vqshrn_n_s64(__p0, __p1) __extension__ ({ \ 24402 int32x2_t __ret; \ 24403 int64x2_t __s0 = __p0; \ 24404 __ret = (int32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 2); \ 24405 __ret; \ 24406 }) 24407 #else 24408 #define vqshrn_n_s64(__p0, __p1) __extension__ ({ \ 24409 int32x2_t __ret; \ 24410 int64x2_t __s0 = __p0; \ 24411 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 24412 __ret = (int32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 2); \ 24413 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 24414 __ret; \ 24415 }) 24416 #define __noswap_vqshrn_n_s64(__p0, __p1) __extension__ ({ \ 24417 int32x2_t __ret; \ 24418 int64x2_t __s0 = __p0; \ 24419 __ret = (int32x2_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 2); \ 24420 __ret; \ 24421 }) 24422 #endif 24423 24424 #ifdef __LITTLE_ENDIAN__ 24425 #define vqshrn_n_s16(__p0, __p1) __extension__ ({ \ 24426 int8x8_t __ret; \ 24427 int16x8_t __s0 = __p0; \ 24428 __ret = (int8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 0); \ 24429 __ret; \ 24430 }) 
24431 #else 24432 #define vqshrn_n_s16(__p0, __p1) __extension__ ({ \ 24433 int8x8_t __ret; \ 24434 int16x8_t __s0 = __p0; \ 24435 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 24436 __ret = (int8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__rev0, __p1, 0); \ 24437 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 24438 __ret; \ 24439 }) 24440 #define __noswap_vqshrn_n_s16(__p0, __p1) __extension__ ({ \ 24441 int8x8_t __ret; \ 24442 int16x8_t __s0 = __p0; \ 24443 __ret = (int8x8_t) __builtin_neon_vqshrn_n_v((int8x16_t)__s0, __p1, 0); \ 24444 __ret; \ 24445 }) 24446 #endif 24447 24448 #ifdef __LITTLE_ENDIAN__ 24449 #define vqshrun_n_s32(__p0, __p1) __extension__ ({ \ 24450 uint16x4_t __ret; \ 24451 int32x4_t __s0 = __p0; \ 24452 __ret = (uint16x4_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 17); \ 24453 __ret; \ 24454 }) 24455 #else 24456 #define vqshrun_n_s32(__p0, __p1) __extension__ ({ \ 24457 uint16x4_t __ret; \ 24458 int32x4_t __s0 = __p0; \ 24459 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 24460 __ret = (uint16x4_t) __builtin_neon_vqshrun_n_v((int8x16_t)__rev0, __p1, 17); \ 24461 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 24462 __ret; \ 24463 }) 24464 #define __noswap_vqshrun_n_s32(__p0, __p1) __extension__ ({ \ 24465 uint16x4_t __ret; \ 24466 int32x4_t __s0 = __p0; \ 24467 __ret = (uint16x4_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 17); \ 24468 __ret; \ 24469 }) 24470 #endif 24471 24472 #ifdef __LITTLE_ENDIAN__ 24473 #define vqshrun_n_s64(__p0, __p1) __extension__ ({ \ 24474 uint32x2_t __ret; \ 24475 int64x2_t __s0 = __p0; \ 24476 __ret = (uint32x2_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 18); \ 24477 __ret; \ 24478 }) 24479 #else 24480 #define vqshrun_n_s64(__p0, __p1) __extension__ ({ \ 24481 uint32x2_t __ret; \ 24482 int64x2_t __s0 = __p0; \ 24483 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 
1, 0); \ 24484 __ret = (uint32x2_t) __builtin_neon_vqshrun_n_v((int8x16_t)__rev0, __p1, 18); \ 24485 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 24486 __ret; \ 24487 }) 24488 #define __noswap_vqshrun_n_s64(__p0, __p1) __extension__ ({ \ 24489 uint32x2_t __ret; \ 24490 int64x2_t __s0 = __p0; \ 24491 __ret = (uint32x2_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 18); \ 24492 __ret; \ 24493 }) 24494 #endif 24495 24496 #ifdef __LITTLE_ENDIAN__ 24497 #define vqshrun_n_s16(__p0, __p1) __extension__ ({ \ 24498 uint8x8_t __ret; \ 24499 int16x8_t __s0 = __p0; \ 24500 __ret = (uint8x8_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 16); \ 24501 __ret; \ 24502 }) 24503 #else 24504 #define vqshrun_n_s16(__p0, __p1) __extension__ ({ \ 24505 uint8x8_t __ret; \ 24506 int16x8_t __s0 = __p0; \ 24507 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 24508 __ret = (uint8x8_t) __builtin_neon_vqshrun_n_v((int8x16_t)__rev0, __p1, 16); \ 24509 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 24510 __ret; \ 24511 }) 24512 #define __noswap_vqshrun_n_s16(__p0, __p1) __extension__ ({ \ 24513 uint8x8_t __ret; \ 24514 int16x8_t __s0 = __p0; \ 24515 __ret = (uint8x8_t) __builtin_neon_vqshrun_n_v((int8x16_t)__s0, __p1, 16); \ 24516 __ret; \ 24517 }) 24518 #endif 24519 24520 #ifdef __LITTLE_ENDIAN__ 24521 __ai __attribute__((target("neon"))) uint8x16_t vqsubq_u8(uint8x16_t __p0, uint8x16_t __p1) { 24522 uint8x16_t __ret; 24523 __ret = (uint8x16_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 24524 return __ret; 24525 } 24526 #else 24527 __ai __attribute__((target("neon"))) uint8x16_t vqsubq_u8(uint8x16_t __p0, uint8x16_t __p1) { 24528 uint8x16_t __ret; 24529 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 24530 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 
1, 0); 24531 __ret = (uint8x16_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 24532 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 24533 return __ret; 24534 } 24535 #endif 24536 24537 #ifdef __LITTLE_ENDIAN__ 24538 __ai __attribute__((target("neon"))) uint32x4_t vqsubq_u32(uint32x4_t __p0, uint32x4_t __p1) { 24539 uint32x4_t __ret; 24540 __ret = (uint32x4_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 24541 return __ret; 24542 } 24543 #else 24544 __ai __attribute__((target("neon"))) uint32x4_t vqsubq_u32(uint32x4_t __p0, uint32x4_t __p1) { 24545 uint32x4_t __ret; 24546 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 24547 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 24548 __ret = (uint32x4_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 24549 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24550 return __ret; 24551 } 24552 #endif 24553 24554 #ifdef __LITTLE_ENDIAN__ 24555 __ai __attribute__((target("neon"))) uint64x2_t vqsubq_u64(uint64x2_t __p0, uint64x2_t __p1) { 24556 uint64x2_t __ret; 24557 __ret = (uint64x2_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 24558 return __ret; 24559 } 24560 #else 24561 __ai __attribute__((target("neon"))) uint64x2_t vqsubq_u64(uint64x2_t __p0, uint64x2_t __p1) { 24562 uint64x2_t __ret; 24563 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24564 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 24565 __ret = (uint64x2_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 24566 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24567 return __ret; 24568 } 24569 #endif 24570 24571 #ifdef __LITTLE_ENDIAN__ 24572 __ai __attribute__((target("neon"))) uint16x8_t vqsubq_u16(uint16x8_t __p0, uint16x8_t __p1) { 24573 uint16x8_t __ret; 24574 __ret = (uint16x8_t) 
__builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 24575 return __ret; 24576 } 24577 #else 24578 __ai __attribute__((target("neon"))) uint16x8_t vqsubq_u16(uint16x8_t __p0, uint16x8_t __p1) { 24579 uint16x8_t __ret; 24580 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 24581 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 24582 __ret = (uint16x8_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 24583 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 24584 return __ret; 24585 } 24586 #endif 24587 24588 #ifdef __LITTLE_ENDIAN__ 24589 __ai __attribute__((target("neon"))) int8x16_t vqsubq_s8(int8x16_t __p0, int8x16_t __p1) { 24590 int8x16_t __ret; 24591 __ret = (int8x16_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 24592 return __ret; 24593 } 24594 #else 24595 __ai __attribute__((target("neon"))) int8x16_t vqsubq_s8(int8x16_t __p0, int8x16_t __p1) { 24596 int8x16_t __ret; 24597 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 24598 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 24599 __ret = (int8x16_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 24600 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 24601 return __ret; 24602 } 24603 #endif 24604 24605 #ifdef __LITTLE_ENDIAN__ 24606 __ai __attribute__((target("neon"))) int32x4_t vqsubq_s32(int32x4_t __p0, int32x4_t __p1) { 24607 int32x4_t __ret; 24608 __ret = (int32x4_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 24609 return __ret; 24610 } 24611 #else 24612 __ai __attribute__((target("neon"))) int32x4_t vqsubq_s32(int32x4_t __p0, int32x4_t __p1) { 24613 int32x4_t __ret; 24614 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, 
__p0, 3, 2, 1, 0); 24615 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 24616 __ret = (int32x4_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 24617 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24618 return __ret; 24619 } 24620 #endif 24621 24622 #ifdef __LITTLE_ENDIAN__ 24623 __ai __attribute__((target("neon"))) int64x2_t vqsubq_s64(int64x2_t __p0, int64x2_t __p1) { 24624 int64x2_t __ret; 24625 __ret = (int64x2_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 24626 return __ret; 24627 } 24628 #else 24629 __ai __attribute__((target("neon"))) int64x2_t vqsubq_s64(int64x2_t __p0, int64x2_t __p1) { 24630 int64x2_t __ret; 24631 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24632 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 24633 __ret = (int64x2_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 24634 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24635 return __ret; 24636 } 24637 #endif 24638 24639 #ifdef __LITTLE_ENDIAN__ 24640 __ai __attribute__((target("neon"))) int16x8_t vqsubq_s16(int16x8_t __p0, int16x8_t __p1) { 24641 int16x8_t __ret; 24642 __ret = (int16x8_t) __builtin_neon_vqsubq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 24643 return __ret; 24644 } 24645 #else 24646 __ai __attribute__((target("neon"))) int16x8_t vqsubq_s16(int16x8_t __p0, int16x8_t __p1) { 24647 int16x8_t __ret; 24648 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 24649 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 24650 __ret = (int16x8_t) __builtin_neon_vqsubq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 24651 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 24652 return __ret; 24653 } 24654 #endif 24655 24656 #ifdef __LITTLE_ENDIAN__ 24657 __ai __attribute__((target("neon"))) uint8x8_t vqsub_u8(uint8x8_t __p0, uint8x8_t __p1) { 24658 
uint8x8_t __ret; 24659 __ret = (uint8x8_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 24660 return __ret; 24661 } 24662 #else 24663 __ai __attribute__((target("neon"))) uint8x8_t vqsub_u8(uint8x8_t __p0, uint8x8_t __p1) { 24664 uint8x8_t __ret; 24665 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 24666 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 24667 __ret = (uint8x8_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 24668 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 24669 return __ret; 24670 } 24671 #endif 24672 24673 #ifdef __LITTLE_ENDIAN__ 24674 __ai __attribute__((target("neon"))) uint32x2_t vqsub_u32(uint32x2_t __p0, uint32x2_t __p1) { 24675 uint32x2_t __ret; 24676 __ret = (uint32x2_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 24677 return __ret; 24678 } 24679 #else 24680 __ai __attribute__((target("neon"))) uint32x2_t vqsub_u32(uint32x2_t __p0, uint32x2_t __p1) { 24681 uint32x2_t __ret; 24682 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24683 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 24684 __ret = (uint32x2_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 24685 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24686 return __ret; 24687 } 24688 #endif 24689 24690 __ai __attribute__((target("neon"))) uint64x1_t vqsub_u64(uint64x1_t __p0, uint64x1_t __p1) { 24691 uint64x1_t __ret; 24692 __ret = (uint64x1_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 24693 return __ret; 24694 } 24695 #ifdef __LITTLE_ENDIAN__ 24696 __ai __attribute__((target("neon"))) uint16x4_t vqsub_u16(uint16x4_t __p0, uint16x4_t __p1) { 24697 uint16x4_t __ret; 24698 __ret = (uint16x4_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 24699 return __ret; 24700 } 24701 #else 24702 __ai __attribute__((target("neon"))) uint16x4_t 
vqsub_u16(uint16x4_t __p0, uint16x4_t __p1) { 24703 uint16x4_t __ret; 24704 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 24705 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 24706 __ret = (uint16x4_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 24707 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24708 return __ret; 24709 } 24710 #endif 24711 24712 #ifdef __LITTLE_ENDIAN__ 24713 __ai __attribute__((target("neon"))) int8x8_t vqsub_s8(int8x8_t __p0, int8x8_t __p1) { 24714 int8x8_t __ret; 24715 __ret = (int8x8_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 24716 return __ret; 24717 } 24718 #else 24719 __ai __attribute__((target("neon"))) int8x8_t vqsub_s8(int8x8_t __p0, int8x8_t __p1) { 24720 int8x8_t __ret; 24721 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 24722 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 24723 __ret = (int8x8_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 24724 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 24725 return __ret; 24726 } 24727 #endif 24728 24729 #ifdef __LITTLE_ENDIAN__ 24730 __ai __attribute__((target("neon"))) int32x2_t vqsub_s32(int32x2_t __p0, int32x2_t __p1) { 24731 int32x2_t __ret; 24732 __ret = (int32x2_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 24733 return __ret; 24734 } 24735 #else 24736 __ai __attribute__((target("neon"))) int32x2_t vqsub_s32(int32x2_t __p0, int32x2_t __p1) { 24737 int32x2_t __ret; 24738 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24739 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 24740 __ret = (int32x2_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 24741 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24742 return __ret; 24743 } 24744 #endif 24745 24746 __ai 
__attribute__((target("neon"))) int64x1_t vqsub_s64(int64x1_t __p0, int64x1_t __p1) { 24747 int64x1_t __ret; 24748 __ret = (int64x1_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 3); 24749 return __ret; 24750 } 24751 #ifdef __LITTLE_ENDIAN__ 24752 __ai __attribute__((target("neon"))) int16x4_t vqsub_s16(int16x4_t __p0, int16x4_t __p1) { 24753 int16x4_t __ret; 24754 __ret = (int16x4_t) __builtin_neon_vqsub_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 24755 return __ret; 24756 } 24757 #else 24758 __ai __attribute__((target("neon"))) int16x4_t vqsub_s16(int16x4_t __p0, int16x4_t __p1) { 24759 int16x4_t __ret; 24760 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 24761 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 24762 __ret = (int16x4_t) __builtin_neon_vqsub_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 24763 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24764 return __ret; 24765 } 24766 #endif 24767 24768 #ifdef __LITTLE_ENDIAN__ 24769 __ai __attribute__((target("neon"))) uint16x4_t vraddhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 24770 uint16x4_t __ret; 24771 __ret = (uint16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17); 24772 return __ret; 24773 } 24774 #else 24775 __ai __attribute__((target("neon"))) uint16x4_t vraddhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 24776 uint16x4_t __ret; 24777 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 24778 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 24779 __ret = (uint16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 17); 24780 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24781 return __ret; 24782 } 24783 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vraddhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 24784 uint16x4_t __ret; 24785 __ret = (uint16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17); 24786 return __ret; 
24787 } 24788 #endif 24789 24790 #ifdef __LITTLE_ENDIAN__ 24791 __ai __attribute__((target("neon"))) uint32x2_t vraddhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 24792 uint32x2_t __ret; 24793 __ret = (uint32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18); 24794 return __ret; 24795 } 24796 #else 24797 __ai __attribute__((target("neon"))) uint32x2_t vraddhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 24798 uint32x2_t __ret; 24799 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24800 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 24801 __ret = (uint32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 18); 24802 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24803 return __ret; 24804 } 24805 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vraddhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 24806 uint32x2_t __ret; 24807 __ret = (uint32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18); 24808 return __ret; 24809 } 24810 #endif 24811 24812 #ifdef __LITTLE_ENDIAN__ 24813 __ai __attribute__((target("neon"))) uint8x8_t vraddhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 24814 uint8x8_t __ret; 24815 __ret = (uint8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16); 24816 return __ret; 24817 } 24818 #else 24819 __ai __attribute__((target("neon"))) uint8x8_t vraddhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 24820 uint8x8_t __ret; 24821 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 24822 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 24823 __ret = (uint8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 16); 24824 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 24825 return __ret; 24826 } 24827 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vraddhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 24828 uint8x8_t __ret; 24829 __ret = 
(uint8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16); 24830 return __ret; 24831 } 24832 #endif 24833 24834 #ifdef __LITTLE_ENDIAN__ 24835 __ai __attribute__((target("neon"))) int16x4_t vraddhn_s32(int32x4_t __p0, int32x4_t __p1) { 24836 int16x4_t __ret; 24837 __ret = (int16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1); 24838 return __ret; 24839 } 24840 #else 24841 __ai __attribute__((target("neon"))) int16x4_t vraddhn_s32(int32x4_t __p0, int32x4_t __p1) { 24842 int16x4_t __ret; 24843 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 24844 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 24845 __ret = (int16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 1); 24846 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24847 return __ret; 24848 } 24849 __ai __attribute__((target("neon"))) int16x4_t __noswap_vraddhn_s32(int32x4_t __p0, int32x4_t __p1) { 24850 int16x4_t __ret; 24851 __ret = (int16x4_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1); 24852 return __ret; 24853 } 24854 #endif 24855 24856 #ifdef __LITTLE_ENDIAN__ 24857 __ai __attribute__((target("neon"))) int32x2_t vraddhn_s64(int64x2_t __p0, int64x2_t __p1) { 24858 int32x2_t __ret; 24859 __ret = (int32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2); 24860 return __ret; 24861 } 24862 #else 24863 __ai __attribute__((target("neon"))) int32x2_t vraddhn_s64(int64x2_t __p0, int64x2_t __p1) { 24864 int32x2_t __ret; 24865 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24866 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 24867 __ret = (int32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 2); 24868 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24869 return __ret; 24870 } 24871 __ai __attribute__((target("neon"))) int32x2_t __noswap_vraddhn_s64(int64x2_t __p0, int64x2_t __p1) { 24872 
int32x2_t __ret; 24873 __ret = (int32x2_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2); 24874 return __ret; 24875 } 24876 #endif 24877 24878 #ifdef __LITTLE_ENDIAN__ 24879 __ai __attribute__((target("neon"))) int8x8_t vraddhn_s16(int16x8_t __p0, int16x8_t __p1) { 24880 int8x8_t __ret; 24881 __ret = (int8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0); 24882 return __ret; 24883 } 24884 #else 24885 __ai __attribute__((target("neon"))) int8x8_t vraddhn_s16(int16x8_t __p0, int16x8_t __p1) { 24886 int8x8_t __ret; 24887 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 24888 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 24889 __ret = (int8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 0); 24890 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 24891 return __ret; 24892 } 24893 __ai __attribute__((target("neon"))) int8x8_t __noswap_vraddhn_s16(int16x8_t __p0, int16x8_t __p1) { 24894 int8x8_t __ret; 24895 __ret = (int8x8_t) __builtin_neon_vraddhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0); 24896 return __ret; 24897 } 24898 #endif 24899 24900 #ifdef __LITTLE_ENDIAN__ 24901 __ai __attribute__((target("neon"))) uint32x4_t vrecpeq_u32(uint32x4_t __p0) { 24902 uint32x4_t __ret; 24903 __ret = (uint32x4_t) __builtin_neon_vrecpeq_v((int8x16_t)__p0, 50); 24904 return __ret; 24905 } 24906 #else 24907 __ai __attribute__((target("neon"))) uint32x4_t vrecpeq_u32(uint32x4_t __p0) { 24908 uint32x4_t __ret; 24909 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 24910 __ret = (uint32x4_t) __builtin_neon_vrecpeq_v((int8x16_t)__rev0, 50); 24911 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24912 return __ret; 24913 } 24914 #endif 24915 24916 #ifdef __LITTLE_ENDIAN__ 24917 __ai __attribute__((target("neon"))) float32x4_t vrecpeq_f32(float32x4_t __p0) { 24918 float32x4_t __ret; 24919 __ret = 
(float32x4_t) __builtin_neon_vrecpeq_v((int8x16_t)__p0, 41); 24920 return __ret; 24921 } 24922 #else 24923 __ai __attribute__((target("neon"))) float32x4_t vrecpeq_f32(float32x4_t __p0) { 24924 float32x4_t __ret; 24925 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 24926 __ret = (float32x4_t) __builtin_neon_vrecpeq_v((int8x16_t)__rev0, 41); 24927 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24928 return __ret; 24929 } 24930 #endif 24931 24932 #ifdef __LITTLE_ENDIAN__ 24933 __ai __attribute__((target("neon"))) uint32x2_t vrecpe_u32(uint32x2_t __p0) { 24934 uint32x2_t __ret; 24935 __ret = (uint32x2_t) __builtin_neon_vrecpe_v((int8x8_t)__p0, 18); 24936 return __ret; 24937 } 24938 #else 24939 __ai __attribute__((target("neon"))) uint32x2_t vrecpe_u32(uint32x2_t __p0) { 24940 uint32x2_t __ret; 24941 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24942 __ret = (uint32x2_t) __builtin_neon_vrecpe_v((int8x8_t)__rev0, 18); 24943 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24944 return __ret; 24945 } 24946 #endif 24947 24948 #ifdef __LITTLE_ENDIAN__ 24949 __ai __attribute__((target("neon"))) float32x2_t vrecpe_f32(float32x2_t __p0) { 24950 float32x2_t __ret; 24951 __ret = (float32x2_t) __builtin_neon_vrecpe_v((int8x8_t)__p0, 9); 24952 return __ret; 24953 } 24954 #else 24955 __ai __attribute__((target("neon"))) float32x2_t vrecpe_f32(float32x2_t __p0) { 24956 float32x2_t __ret; 24957 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24958 __ret = (float32x2_t) __builtin_neon_vrecpe_v((int8x8_t)__rev0, 9); 24959 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24960 return __ret; 24961 } 24962 #endif 24963 24964 #ifdef __LITTLE_ENDIAN__ 24965 __ai __attribute__((target("neon"))) float32x4_t vrecpsq_f32(float32x4_t __p0, float32x4_t __p1) { 24966 float32x4_t __ret; 24967 __ret = (float32x4_t) __builtin_neon_vrecpsq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 24968 return __ret; 
24969 } 24970 #else 24971 __ai __attribute__((target("neon"))) float32x4_t vrecpsq_f32(float32x4_t __p0, float32x4_t __p1) { 24972 float32x4_t __ret; 24973 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 24974 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 24975 __ret = (float32x4_t) __builtin_neon_vrecpsq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 24976 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 24977 return __ret; 24978 } 24979 #endif 24980 24981 #ifdef __LITTLE_ENDIAN__ 24982 __ai __attribute__((target("neon"))) float32x2_t vrecps_f32(float32x2_t __p0, float32x2_t __p1) { 24983 float32x2_t __ret; 24984 __ret = (float32x2_t) __builtin_neon_vrecps_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 24985 return __ret; 24986 } 24987 #else 24988 __ai __attribute__((target("neon"))) float32x2_t vrecps_f32(float32x2_t __p0, float32x2_t __p1) { 24989 float32x2_t __ret; 24990 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 24991 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 24992 __ret = (float32x2_t) __builtin_neon_vrecps_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 24993 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 24994 return __ret; 24995 } 24996 #endif 24997 24998 #ifdef __LITTLE_ENDIAN__ 24999 __ai __attribute__((target("neon"))) poly8x8_t vrev16_p8(poly8x8_t __p0) { 25000 poly8x8_t __ret; 25001 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6); 25002 return __ret; 25003 } 25004 #else 25005 __ai __attribute__((target("neon"))) poly8x8_t vrev16_p8(poly8x8_t __p0) { 25006 poly8x8_t __ret; 25007 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25008 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6); 25009 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25010 return __ret; 25011 } 25012 #endif 25013 25014 #ifdef __LITTLE_ENDIAN__ 25015 __ai 
__attribute__((target("neon"))) poly8x16_t vrev16q_p8(poly8x16_t __p0) { 25016 poly8x16_t __ret; 25017 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14); 25018 return __ret; 25019 } 25020 #else 25021 __ai __attribute__((target("neon"))) poly8x16_t vrev16q_p8(poly8x16_t __p0) { 25022 poly8x16_t __ret; 25023 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25024 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14); 25025 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25026 return __ret; 25027 } 25028 #endif 25029 25030 #ifdef __LITTLE_ENDIAN__ 25031 __ai __attribute__((target("neon"))) uint8x16_t vrev16q_u8(uint8x16_t __p0) { 25032 uint8x16_t __ret; 25033 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14); 25034 return __ret; 25035 } 25036 #else 25037 __ai __attribute__((target("neon"))) uint8x16_t vrev16q_u8(uint8x16_t __p0) { 25038 uint8x16_t __ret; 25039 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25040 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14); 25041 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25042 return __ret; 25043 } 25044 #endif 25045 25046 #ifdef __LITTLE_ENDIAN__ 25047 __ai __attribute__((target("neon"))) int8x16_t vrev16q_s8(int8x16_t __p0) { 25048 int8x16_t __ret; 25049 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14); 25050 return __ret; 25051 } 25052 #else 25053 __ai __attribute__((target("neon"))) int8x16_t vrev16q_s8(int8x16_t __p0) { 25054 int8x16_t __ret; 25055 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 
8, 7, 6, 5, 4, 3, 2, 1, 0); 25056 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6, 9, 8, 11, 10, 13, 12, 15, 14); 25057 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25058 return __ret; 25059 } 25060 #endif 25061 25062 #ifdef __LITTLE_ENDIAN__ 25063 __ai __attribute__((target("neon"))) uint8x8_t vrev16_u8(uint8x8_t __p0) { 25064 uint8x8_t __ret; 25065 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6); 25066 return __ret; 25067 } 25068 #else 25069 __ai __attribute__((target("neon"))) uint8x8_t vrev16_u8(uint8x8_t __p0) { 25070 uint8x8_t __ret; 25071 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25072 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6); 25073 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25074 return __ret; 25075 } 25076 #endif 25077 25078 #ifdef __LITTLE_ENDIAN__ 25079 __ai __attribute__((target("neon"))) int8x8_t vrev16_s8(int8x8_t __p0) { 25080 int8x8_t __ret; 25081 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6); 25082 return __ret; 25083 } 25084 #else 25085 __ai __attribute__((target("neon"))) int8x8_t vrev16_s8(int8x8_t __p0) { 25086 int8x8_t __ret; 25087 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25088 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6); 25089 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25090 return __ret; 25091 } 25092 #endif 25093 25094 #ifdef __LITTLE_ENDIAN__ 25095 __ai __attribute__((target("neon"))) poly8x8_t vrev32_p8(poly8x8_t __p0) { 25096 poly8x8_t __ret; 25097 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4); 25098 return __ret; 25099 } 25100 #else 25101 __ai __attribute__((target("neon"))) poly8x8_t vrev32_p8(poly8x8_t __p0) { 25102 poly8x8_t __ret; 25103 poly8x8_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25104 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4); 25105 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25106 return __ret; 25107 } 25108 #endif 25109 25110 #ifdef __LITTLE_ENDIAN__ 25111 __ai __attribute__((target("neon"))) poly16x4_t vrev32_p16(poly16x4_t __p0) { 25112 poly16x4_t __ret; 25113 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2); 25114 return __ret; 25115 } 25116 #else 25117 __ai __attribute__((target("neon"))) poly16x4_t vrev32_p16(poly16x4_t __p0) { 25118 poly16x4_t __ret; 25119 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25120 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2); 25121 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25122 return __ret; 25123 } 25124 #endif 25125 25126 #ifdef __LITTLE_ENDIAN__ 25127 __ai __attribute__((target("neon"))) poly8x16_t vrev32q_p8(poly8x16_t __p0) { 25128 poly8x16_t __ret; 25129 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12); 25130 return __ret; 25131 } 25132 #else 25133 __ai __attribute__((target("neon"))) poly8x16_t vrev32q_p8(poly8x16_t __p0) { 25134 poly8x16_t __ret; 25135 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25136 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12); 25137 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25138 return __ret; 25139 } 25140 #endif 25141 25142 #ifdef __LITTLE_ENDIAN__ 25143 __ai __attribute__((target("neon"))) poly16x8_t vrev32q_p16(poly16x8_t __p0) { 25144 poly16x8_t __ret; 25145 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6); 25146 return __ret; 25147 } 25148 #else 25149 __ai __attribute__((target("neon"))) poly16x8_t vrev32q_p16(poly16x8_t __p0) { 
25150 poly16x8_t __ret; 25151 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25152 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6); 25153 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25154 return __ret; 25155 } 25156 #endif 25157 25158 #ifdef __LITTLE_ENDIAN__ 25159 __ai __attribute__((target("neon"))) uint8x16_t vrev32q_u8(uint8x16_t __p0) { 25160 uint8x16_t __ret; 25161 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12); 25162 return __ret; 25163 } 25164 #else 25165 __ai __attribute__((target("neon"))) uint8x16_t vrev32q_u8(uint8x16_t __p0) { 25166 uint8x16_t __ret; 25167 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25168 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12); 25169 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25170 return __ret; 25171 } 25172 #endif 25173 25174 #ifdef __LITTLE_ENDIAN__ 25175 __ai __attribute__((target("neon"))) uint16x8_t vrev32q_u16(uint16x8_t __p0) { 25176 uint16x8_t __ret; 25177 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6); 25178 return __ret; 25179 } 25180 #else 25181 __ai __attribute__((target("neon"))) uint16x8_t vrev32q_u16(uint16x8_t __p0) { 25182 uint16x8_t __ret; 25183 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25184 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6); 25185 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25186 return __ret; 25187 } 25188 #endif 25189 25190 #ifdef __LITTLE_ENDIAN__ 25191 __ai __attribute__((target("neon"))) int8x16_t vrev32q_s8(int8x16_t __p0) { 25192 int8x16_t __ret; 25193 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 
12); 25194 return __ret; 25195 } 25196 #else 25197 __ai __attribute__((target("neon"))) int8x16_t vrev32q_s8(int8x16_t __p0) { 25198 int8x16_t __ret; 25199 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25200 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4, 11, 10, 9, 8, 15, 14, 13, 12); 25201 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25202 return __ret; 25203 } 25204 #endif 25205 25206 #ifdef __LITTLE_ENDIAN__ 25207 __ai __attribute__((target("neon"))) int16x8_t vrev32q_s16(int16x8_t __p0) { 25208 int16x8_t __ret; 25209 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2, 5, 4, 7, 6); 25210 return __ret; 25211 } 25212 #else 25213 __ai __attribute__((target("neon"))) int16x8_t vrev32q_s16(int16x8_t __p0) { 25214 int16x8_t __ret; 25215 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25216 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2, 5, 4, 7, 6); 25217 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25218 return __ret; 25219 } 25220 #endif 25221 25222 #ifdef __LITTLE_ENDIAN__ 25223 __ai __attribute__((target("neon"))) uint8x8_t vrev32_u8(uint8x8_t __p0) { 25224 uint8x8_t __ret; 25225 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4); 25226 return __ret; 25227 } 25228 #else 25229 __ai __attribute__((target("neon"))) uint8x8_t vrev32_u8(uint8x8_t __p0) { 25230 uint8x8_t __ret; 25231 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25232 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4); 25233 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25234 return __ret; 25235 } 25236 #endif 25237 25238 #ifdef __LITTLE_ENDIAN__ 25239 __ai __attribute__((target("neon"))) uint16x4_t vrev32_u16(uint16x4_t __p0) { 25240 uint16x4_t __ret; 25241 __ret = 
__builtin_shufflevector(__p0, __p0, 1, 0, 3, 2); 25242 return __ret; 25243 } 25244 #else 25245 __ai __attribute__((target("neon"))) uint16x4_t vrev32_u16(uint16x4_t __p0) { 25246 uint16x4_t __ret; 25247 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25248 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2); 25249 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25250 return __ret; 25251 } 25252 #endif 25253 25254 #ifdef __LITTLE_ENDIAN__ 25255 __ai __attribute__((target("neon"))) int8x8_t vrev32_s8(int8x8_t __p0) { 25256 int8x8_t __ret; 25257 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4); 25258 return __ret; 25259 } 25260 #else 25261 __ai __attribute__((target("neon"))) int8x8_t vrev32_s8(int8x8_t __p0) { 25262 int8x8_t __ret; 25263 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25264 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4); 25265 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25266 return __ret; 25267 } 25268 #endif 25269 25270 #ifdef __LITTLE_ENDIAN__ 25271 __ai __attribute__((target("neon"))) int16x4_t vrev32_s16(int16x4_t __p0) { 25272 int16x4_t __ret; 25273 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2); 25274 return __ret; 25275 } 25276 #else 25277 __ai __attribute__((target("neon"))) int16x4_t vrev32_s16(int16x4_t __p0) { 25278 int16x4_t __ret; 25279 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25280 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2); 25281 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25282 return __ret; 25283 } 25284 #endif 25285 25286 #ifdef __LITTLE_ENDIAN__ 25287 __ai __attribute__((target("neon"))) poly8x8_t vrev64_p8(poly8x8_t __p0) { 25288 poly8x8_t __ret; 25289 __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25290 return __ret; 25291 } 25292 #else 25293 __ai 
__attribute__((target("neon"))) poly8x8_t vrev64_p8(poly8x8_t __p0) { 25294 poly8x8_t __ret; 25295 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25296 __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0); 25297 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25298 return __ret; 25299 } 25300 #endif 25301 25302 #ifdef __LITTLE_ENDIAN__ 25303 __ai __attribute__((target("neon"))) poly16x4_t vrev64_p16(poly16x4_t __p0) { 25304 poly16x4_t __ret; 25305 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25306 return __ret; 25307 } 25308 #else 25309 __ai __attribute__((target("neon"))) poly16x4_t vrev64_p16(poly16x4_t __p0) { 25310 poly16x4_t __ret; 25311 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25312 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0); 25313 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25314 return __ret; 25315 } 25316 #endif 25317 25318 #ifdef __LITTLE_ENDIAN__ 25319 __ai __attribute__((target("neon"))) poly8x16_t vrev64q_p8(poly8x16_t __p0) { 25320 poly8x16_t __ret; 25321 __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8); 25322 return __ret; 25323 } 25324 #else 25325 __ai __attribute__((target("neon"))) poly8x16_t vrev64q_p8(poly8x16_t __p0) { 25326 poly8x16_t __ret; 25327 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25328 __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8); 25329 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25330 return __ret; 25331 } 25332 #endif 25333 25334 #ifdef __LITTLE_ENDIAN__ 25335 __ai __attribute__((target("neon"))) poly16x8_t vrev64q_p16(poly16x8_t __p0) { 25336 poly16x8_t __ret; 25337 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4); 
25338 return __ret; 25339 } 25340 #else 25341 __ai __attribute__((target("neon"))) poly16x8_t vrev64q_p16(poly16x8_t __p0) { 25342 poly16x8_t __ret; 25343 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25344 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4); 25345 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25346 return __ret; 25347 } 25348 #endif 25349 25350 #ifdef __LITTLE_ENDIAN__ 25351 __ai __attribute__((target("neon"))) uint8x16_t vrev64q_u8(uint8x16_t __p0) { 25352 uint8x16_t __ret; 25353 __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8); 25354 return __ret; 25355 } 25356 #else 25357 __ai __attribute__((target("neon"))) uint8x16_t vrev64q_u8(uint8x16_t __p0) { 25358 uint8x16_t __ret; 25359 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25360 __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8); 25361 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25362 return __ret; 25363 } 25364 #endif 25365 25366 #ifdef __LITTLE_ENDIAN__ 25367 __ai __attribute__((target("neon"))) uint32x4_t vrev64q_u32(uint32x4_t __p0) { 25368 uint32x4_t __ret; 25369 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2); 25370 return __ret; 25371 } 25372 #else 25373 __ai __attribute__((target("neon"))) uint32x4_t vrev64q_u32(uint32x4_t __p0) { 25374 uint32x4_t __ret; 25375 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25376 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2); 25377 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25378 return __ret; 25379 } 25380 #endif 25381 25382 #ifdef __LITTLE_ENDIAN__ 25383 __ai __attribute__((target("neon"))) uint16x8_t vrev64q_u16(uint16x8_t __p0) { 25384 uint16x8_t __ret; 25385 __ret = 
__builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4); 25386 return __ret; 25387 } 25388 #else 25389 __ai __attribute__((target("neon"))) uint16x8_t vrev64q_u16(uint16x8_t __p0) { 25390 uint16x8_t __ret; 25391 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25392 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4); 25393 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25394 return __ret; 25395 } 25396 #endif 25397 25398 #ifdef __LITTLE_ENDIAN__ 25399 __ai __attribute__((target("neon"))) int8x16_t vrev64q_s8(int8x16_t __p0) { 25400 int8x16_t __ret; 25401 __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8); 25402 return __ret; 25403 } 25404 #else 25405 __ai __attribute__((target("neon"))) int8x16_t vrev64q_s8(int8x16_t __p0) { 25406 int8x16_t __ret; 25407 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25408 __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0, 15, 14, 13, 12, 11, 10, 9, 8); 25409 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25410 return __ret; 25411 } 25412 #endif 25413 25414 #ifdef __LITTLE_ENDIAN__ 25415 __ai __attribute__((target("neon"))) float32x4_t vrev64q_f32(float32x4_t __p0) { 25416 float32x4_t __ret; 25417 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2); 25418 return __ret; 25419 } 25420 #else 25421 __ai __attribute__((target("neon"))) float32x4_t vrev64q_f32(float32x4_t __p0) { 25422 float32x4_t __ret; 25423 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25424 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2); 25425 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25426 return __ret; 25427 } 25428 #endif 25429 25430 #ifdef __LITTLE_ENDIAN__ 25431 __ai __attribute__((target("neon"))) int32x4_t 
vrev64q_s32(int32x4_t __p0) { 25432 int32x4_t __ret; 25433 __ret = __builtin_shufflevector(__p0, __p0, 1, 0, 3, 2); 25434 return __ret; 25435 } 25436 #else 25437 __ai __attribute__((target("neon"))) int32x4_t vrev64q_s32(int32x4_t __p0) { 25438 int32x4_t __ret; 25439 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25440 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0, 3, 2); 25441 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25442 return __ret; 25443 } 25444 #endif 25445 25446 #ifdef __LITTLE_ENDIAN__ 25447 __ai __attribute__((target("neon"))) int16x8_t vrev64q_s16(int16x8_t __p0) { 25448 int16x8_t __ret; 25449 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4); 25450 return __ret; 25451 } 25452 #else 25453 __ai __attribute__((target("neon"))) int16x8_t vrev64q_s16(int16x8_t __p0) { 25454 int16x8_t __ret; 25455 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25456 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0, 7, 6, 5, 4); 25457 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25458 return __ret; 25459 } 25460 #endif 25461 25462 #ifdef __LITTLE_ENDIAN__ 25463 __ai __attribute__((target("neon"))) uint8x8_t vrev64_u8(uint8x8_t __p0) { 25464 uint8x8_t __ret; 25465 __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25466 return __ret; 25467 } 25468 #else 25469 __ai __attribute__((target("neon"))) uint8x8_t vrev64_u8(uint8x8_t __p0) { 25470 uint8x8_t __ret; 25471 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25472 __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0); 25473 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25474 return __ret; 25475 } 25476 #endif 25477 25478 #ifdef __LITTLE_ENDIAN__ 25479 __ai __attribute__((target("neon"))) uint32x2_t vrev64_u32(uint32x2_t __p0) { 25480 uint32x2_t __ret; 25481 __ret = 
__builtin_shufflevector(__p0, __p0, 1, 0); 25482 return __ret; 25483 } 25484 #else 25485 __ai __attribute__((target("neon"))) uint32x2_t vrev64_u32(uint32x2_t __p0) { 25486 uint32x2_t __ret; 25487 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 25488 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0); 25489 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 25490 return __ret; 25491 } 25492 #endif 25493 25494 #ifdef __LITTLE_ENDIAN__ 25495 __ai __attribute__((target("neon"))) uint16x4_t vrev64_u16(uint16x4_t __p0) { 25496 uint16x4_t __ret; 25497 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25498 return __ret; 25499 } 25500 #else 25501 __ai __attribute__((target("neon"))) uint16x4_t vrev64_u16(uint16x4_t __p0) { 25502 uint16x4_t __ret; 25503 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25504 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0); 25505 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25506 return __ret; 25507 } 25508 #endif 25509 25510 #ifdef __LITTLE_ENDIAN__ 25511 __ai __attribute__((target("neon"))) int8x8_t vrev64_s8(int8x8_t __p0) { 25512 int8x8_t __ret; 25513 __ret = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25514 return __ret; 25515 } 25516 #else 25517 __ai __attribute__((target("neon"))) int8x8_t vrev64_s8(int8x8_t __p0) { 25518 int8x8_t __ret; 25519 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25520 __ret = __builtin_shufflevector(__rev0, __rev0, 7, 6, 5, 4, 3, 2, 1, 0); 25521 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25522 return __ret; 25523 } 25524 #endif 25525 25526 #ifdef __LITTLE_ENDIAN__ 25527 __ai __attribute__((target("neon"))) float32x2_t vrev64_f32(float32x2_t __p0) { 25528 float32x2_t __ret; 25529 __ret = __builtin_shufflevector(__p0, __p0, 1, 0); 25530 return __ret; 25531 } 25532 #else 25533 __ai __attribute__((target("neon"))) float32x2_t 
vrev64_f32(float32x2_t __p0) { 25534 float32x2_t __ret; 25535 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 25536 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0); 25537 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 25538 return __ret; 25539 } 25540 #endif 25541 25542 #ifdef __LITTLE_ENDIAN__ 25543 __ai __attribute__((target("neon"))) int32x2_t vrev64_s32(int32x2_t __p0) { 25544 int32x2_t __ret; 25545 __ret = __builtin_shufflevector(__p0, __p0, 1, 0); 25546 return __ret; 25547 } 25548 #else 25549 __ai __attribute__((target("neon"))) int32x2_t vrev64_s32(int32x2_t __p0) { 25550 int32x2_t __ret; 25551 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 25552 __ret = __builtin_shufflevector(__rev0, __rev0, 1, 0); 25553 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 25554 return __ret; 25555 } 25556 #endif 25557 25558 #ifdef __LITTLE_ENDIAN__ 25559 __ai __attribute__((target("neon"))) int16x4_t vrev64_s16(int16x4_t __p0) { 25560 int16x4_t __ret; 25561 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25562 return __ret; 25563 } 25564 #else 25565 __ai __attribute__((target("neon"))) int16x4_t vrev64_s16(int16x4_t __p0) { 25566 int16x4_t __ret; 25567 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25568 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0); 25569 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25570 return __ret; 25571 } 25572 #endif 25573 25574 #ifdef __LITTLE_ENDIAN__ 25575 __ai __attribute__((target("neon"))) float16x8_t vrev64q_f16(float16x8_t __p0) { 25576 float16x8_t __ret; 25577 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0, 7, 6, 5, 4); 25578 return __ret; 25579 } 25580 #else 25581 __ai __attribute__((target("neon"))) float16x8_t vrev64q_f16(float16x8_t __p0) { 25582 float16x8_t __ret; 25583 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25584 __ret = __builtin_shufflevector(__rev0, 
__rev0, 3, 2, 1, 0, 7, 6, 5, 4); 25585 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25586 return __ret; 25587 } 25588 #endif 25589 25590 #ifdef __LITTLE_ENDIAN__ 25591 __ai __attribute__((target("neon"))) float16x4_t vrev64_f16(float16x4_t __p0) { 25592 float16x4_t __ret; 25593 __ret = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25594 return __ret; 25595 } 25596 #else 25597 __ai __attribute__((target("neon"))) float16x4_t vrev64_f16(float16x4_t __p0) { 25598 float16x4_t __ret; 25599 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25600 __ret = __builtin_shufflevector(__rev0, __rev0, 3, 2, 1, 0); 25601 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25602 return __ret; 25603 } 25604 #endif 25605 25606 #ifdef __LITTLE_ENDIAN__ 25607 __ai __attribute__((target("neon"))) uint8x16_t vrhaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 25608 uint8x16_t __ret; 25609 __ret = (uint8x16_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 25610 return __ret; 25611 } 25612 #else 25613 __ai __attribute__((target("neon"))) uint8x16_t vrhaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 25614 uint8x16_t __ret; 25615 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25616 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25617 __ret = (uint8x16_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 25618 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25619 return __ret; 25620 } 25621 #endif 25622 25623 #ifdef __LITTLE_ENDIAN__ 25624 __ai __attribute__((target("neon"))) uint32x4_t vrhaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 25625 uint32x4_t __ret; 25626 __ret = (uint32x4_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 25627 return __ret; 25628 } 25629 #else 25630 __ai 
__attribute__((target("neon"))) uint32x4_t vrhaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 25631 uint32x4_t __ret; 25632 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25633 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 25634 __ret = (uint32x4_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 25635 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25636 return __ret; 25637 } 25638 #endif 25639 25640 #ifdef __LITTLE_ENDIAN__ 25641 __ai __attribute__((target("neon"))) uint16x8_t vrhaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 25642 uint16x8_t __ret; 25643 __ret = (uint16x8_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 25644 return __ret; 25645 } 25646 #else 25647 __ai __attribute__((target("neon"))) uint16x8_t vrhaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 25648 uint16x8_t __ret; 25649 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25650 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 25651 __ret = (uint16x8_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 25652 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25653 return __ret; 25654 } 25655 #endif 25656 25657 #ifdef __LITTLE_ENDIAN__ 25658 __ai __attribute__((target("neon"))) int8x16_t vrhaddq_s8(int8x16_t __p0, int8x16_t __p1) { 25659 int8x16_t __ret; 25660 __ret = (int8x16_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 25661 return __ret; 25662 } 25663 #else 25664 __ai __attribute__((target("neon"))) int8x16_t vrhaddq_s8(int8x16_t __p0, int8x16_t __p1) { 25665 int8x16_t __ret; 25666 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25667 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25668 __ret = (int8x16_t) 
__builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 25669 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25670 return __ret; 25671 } 25672 #endif 25673 25674 #ifdef __LITTLE_ENDIAN__ 25675 __ai __attribute__((target("neon"))) int32x4_t vrhaddq_s32(int32x4_t __p0, int32x4_t __p1) { 25676 int32x4_t __ret; 25677 __ret = (int32x4_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 25678 return __ret; 25679 } 25680 #else 25681 __ai __attribute__((target("neon"))) int32x4_t vrhaddq_s32(int32x4_t __p0, int32x4_t __p1) { 25682 int32x4_t __ret; 25683 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25684 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 25685 __ret = (int32x4_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 25686 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25687 return __ret; 25688 } 25689 #endif 25690 25691 #ifdef __LITTLE_ENDIAN__ 25692 __ai __attribute__((target("neon"))) int16x8_t vrhaddq_s16(int16x8_t __p0, int16x8_t __p1) { 25693 int16x8_t __ret; 25694 __ret = (int16x8_t) __builtin_neon_vrhaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 25695 return __ret; 25696 } 25697 #else 25698 __ai __attribute__((target("neon"))) int16x8_t vrhaddq_s16(int16x8_t __p0, int16x8_t __p1) { 25699 int16x8_t __ret; 25700 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25701 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 25702 __ret = (int16x8_t) __builtin_neon_vrhaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 25703 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25704 return __ret; 25705 } 25706 #endif 25707 25708 #ifdef __LITTLE_ENDIAN__ 25709 __ai __attribute__((target("neon"))) uint8x8_t vrhadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 25710 uint8x8_t __ret; 25711 __ret = (uint8x8_t) 
__builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 25712 return __ret; 25713 } 25714 #else 25715 __ai __attribute__((target("neon"))) uint8x8_t vrhadd_u8(uint8x8_t __p0, uint8x8_t __p1) { 25716 uint8x8_t __ret; 25717 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25718 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 25719 __ret = (uint8x8_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 25720 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25721 return __ret; 25722 } 25723 #endif 25724 25725 #ifdef __LITTLE_ENDIAN__ 25726 __ai __attribute__((target("neon"))) uint32x2_t vrhadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 25727 uint32x2_t __ret; 25728 __ret = (uint32x2_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 25729 return __ret; 25730 } 25731 #else 25732 __ai __attribute__((target("neon"))) uint32x2_t vrhadd_u32(uint32x2_t __p0, uint32x2_t __p1) { 25733 uint32x2_t __ret; 25734 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 25735 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 25736 __ret = (uint32x2_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 25737 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 25738 return __ret; 25739 } 25740 #endif 25741 25742 #ifdef __LITTLE_ENDIAN__ 25743 __ai __attribute__((target("neon"))) uint16x4_t vrhadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 25744 uint16x4_t __ret; 25745 __ret = (uint16x4_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 25746 return __ret; 25747 } 25748 #else 25749 __ai __attribute__((target("neon"))) uint16x4_t vrhadd_u16(uint16x4_t __p0, uint16x4_t __p1) { 25750 uint16x4_t __ret; 25751 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25752 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 25753 __ret = (uint16x4_t) 
__builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 25754 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25755 return __ret; 25756 } 25757 #endif 25758 25759 #ifdef __LITTLE_ENDIAN__ 25760 __ai __attribute__((target("neon"))) int8x8_t vrhadd_s8(int8x8_t __p0, int8x8_t __p1) { 25761 int8x8_t __ret; 25762 __ret = (int8x8_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 25763 return __ret; 25764 } 25765 #else 25766 __ai __attribute__((target("neon"))) int8x8_t vrhadd_s8(int8x8_t __p0, int8x8_t __p1) { 25767 int8x8_t __ret; 25768 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25769 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 25770 __ret = (int8x8_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 25771 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25772 return __ret; 25773 } 25774 #endif 25775 25776 #ifdef __LITTLE_ENDIAN__ 25777 __ai __attribute__((target("neon"))) int32x2_t vrhadd_s32(int32x2_t __p0, int32x2_t __p1) { 25778 int32x2_t __ret; 25779 __ret = (int32x2_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 25780 return __ret; 25781 } 25782 #else 25783 __ai __attribute__((target("neon"))) int32x2_t vrhadd_s32(int32x2_t __p0, int32x2_t __p1) { 25784 int32x2_t __ret; 25785 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 25786 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 25787 __ret = (int32x2_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 25788 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 25789 return __ret; 25790 } 25791 #endif 25792 25793 #ifdef __LITTLE_ENDIAN__ 25794 __ai __attribute__((target("neon"))) int16x4_t vrhadd_s16(int16x4_t __p0, int16x4_t __p1) { 25795 int16x4_t __ret; 25796 __ret = (int16x4_t) __builtin_neon_vrhadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 25797 return __ret; 25798 } 25799 #else 25800 __ai 
__attribute__((target("neon"))) int16x4_t vrhadd_s16(int16x4_t __p0, int16x4_t __p1) { 25801 int16x4_t __ret; 25802 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25803 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 25804 __ret = (int16x4_t) __builtin_neon_vrhadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 25805 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25806 return __ret; 25807 } 25808 #endif 25809 25810 #ifdef __LITTLE_ENDIAN__ 25811 __ai __attribute__((target("neon"))) uint8x16_t vrshlq_u8(uint8x16_t __p0, int8x16_t __p1) { 25812 uint8x16_t __ret; 25813 __ret = (uint8x16_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 25814 return __ret; 25815 } 25816 #else 25817 __ai __attribute__((target("neon"))) uint8x16_t vrshlq_u8(uint8x16_t __p0, int8x16_t __p1) { 25818 uint8x16_t __ret; 25819 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25820 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25821 __ret = (uint8x16_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 25822 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25823 return __ret; 25824 } 25825 #endif 25826 25827 #ifdef __LITTLE_ENDIAN__ 25828 __ai __attribute__((target("neon"))) uint32x4_t vrshlq_u32(uint32x4_t __p0, int32x4_t __p1) { 25829 uint32x4_t __ret; 25830 __ret = (uint32x4_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 25831 return __ret; 25832 } 25833 #else 25834 __ai __attribute__((target("neon"))) uint32x4_t vrshlq_u32(uint32x4_t __p0, int32x4_t __p1) { 25835 uint32x4_t __ret; 25836 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25837 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 25838 __ret = (uint32x4_t) 
__builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 25839 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25840 return __ret; 25841 } 25842 #endif 25843 25844 #ifdef __LITTLE_ENDIAN__ 25845 __ai __attribute__((target("neon"))) uint64x2_t vrshlq_u64(uint64x2_t __p0, int64x2_t __p1) { 25846 uint64x2_t __ret; 25847 __ret = (uint64x2_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 25848 return __ret; 25849 } 25850 #else 25851 __ai __attribute__((target("neon"))) uint64x2_t vrshlq_u64(uint64x2_t __p0, int64x2_t __p1) { 25852 uint64x2_t __ret; 25853 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 25854 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 25855 __ret = (uint64x2_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 25856 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 25857 return __ret; 25858 } 25859 #endif 25860 25861 #ifdef __LITTLE_ENDIAN__ 25862 __ai __attribute__((target("neon"))) uint16x8_t vrshlq_u16(uint16x8_t __p0, int16x8_t __p1) { 25863 uint16x8_t __ret; 25864 __ret = (uint16x8_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 25865 return __ret; 25866 } 25867 #else 25868 __ai __attribute__((target("neon"))) uint16x8_t vrshlq_u16(uint16x8_t __p0, int16x8_t __p1) { 25869 uint16x8_t __ret; 25870 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25871 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 25872 __ret = (uint16x8_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 25873 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25874 return __ret; 25875 } 25876 #endif 25877 25878 #ifdef __LITTLE_ENDIAN__ 25879 __ai __attribute__((target("neon"))) int8x16_t vrshlq_s8(int8x16_t __p0, int8x16_t __p1) { 25880 int8x16_t __ret; 25881 __ret = (int8x16_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 
25882 return __ret; 25883 } 25884 #else 25885 __ai __attribute__((target("neon"))) int8x16_t vrshlq_s8(int8x16_t __p0, int8x16_t __p1) { 25886 int8x16_t __ret; 25887 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25888 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25889 __ret = (int8x16_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 25890 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 25891 return __ret; 25892 } 25893 #endif 25894 25895 #ifdef __LITTLE_ENDIAN__ 25896 __ai __attribute__((target("neon"))) int32x4_t vrshlq_s32(int32x4_t __p0, int32x4_t __p1) { 25897 int32x4_t __ret; 25898 __ret = (int32x4_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 25899 return __ret; 25900 } 25901 #else 25902 __ai __attribute__((target("neon"))) int32x4_t vrshlq_s32(int32x4_t __p0, int32x4_t __p1) { 25903 int32x4_t __ret; 25904 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25905 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 25906 __ret = (int32x4_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 25907 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25908 return __ret; 25909 } 25910 #endif 25911 25912 #ifdef __LITTLE_ENDIAN__ 25913 __ai __attribute__((target("neon"))) int64x2_t vrshlq_s64(int64x2_t __p0, int64x2_t __p1) { 25914 int64x2_t __ret; 25915 __ret = (int64x2_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 25916 return __ret; 25917 } 25918 #else 25919 __ai __attribute__((target("neon"))) int64x2_t vrshlq_s64(int64x2_t __p0, int64x2_t __p1) { 25920 int64x2_t __ret; 25921 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 25922 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 25923 __ret = 
(int64x2_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 25924 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 25925 return __ret; 25926 } 25927 #endif 25928 25929 #ifdef __LITTLE_ENDIAN__ 25930 __ai __attribute__((target("neon"))) int16x8_t vrshlq_s16(int16x8_t __p0, int16x8_t __p1) { 25931 int16x8_t __ret; 25932 __ret = (int16x8_t) __builtin_neon_vrshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 25933 return __ret; 25934 } 25935 #else 25936 __ai __attribute__((target("neon"))) int16x8_t vrshlq_s16(int16x8_t __p0, int16x8_t __p1) { 25937 int16x8_t __ret; 25938 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25939 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 25940 __ret = (int16x8_t) __builtin_neon_vrshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 25941 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25942 return __ret; 25943 } 25944 #endif 25945 25946 #ifdef __LITTLE_ENDIAN__ 25947 __ai __attribute__((target("neon"))) uint8x8_t vrshl_u8(uint8x8_t __p0, int8x8_t __p1) { 25948 uint8x8_t __ret; 25949 __ret = (uint8x8_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 25950 return __ret; 25951 } 25952 #else 25953 __ai __attribute__((target("neon"))) uint8x8_t vrshl_u8(uint8x8_t __p0, int8x8_t __p1) { 25954 uint8x8_t __ret; 25955 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 25956 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 25957 __ret = (uint8x8_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 25958 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 25959 return __ret; 25960 } 25961 #endif 25962 25963 #ifdef __LITTLE_ENDIAN__ 25964 __ai __attribute__((target("neon"))) uint32x2_t vrshl_u32(uint32x2_t __p0, int32x2_t __p1) { 25965 uint32x2_t __ret; 25966 __ret = (uint32x2_t) 
__builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 25967 return __ret; 25968 } 25969 #else 25970 __ai __attribute__((target("neon"))) uint32x2_t vrshl_u32(uint32x2_t __p0, int32x2_t __p1) { 25971 uint32x2_t __ret; 25972 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 25973 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 25974 __ret = (uint32x2_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 25975 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 25976 return __ret; 25977 } 25978 #endif 25979 25980 __ai __attribute__((target("neon"))) uint64x1_t vrshl_u64(uint64x1_t __p0, int64x1_t __p1) { 25981 uint64x1_t __ret; 25982 __ret = (uint64x1_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 25983 return __ret; 25984 } 25985 #ifdef __LITTLE_ENDIAN__ 25986 __ai __attribute__((target("neon"))) uint16x4_t vrshl_u16(uint16x4_t __p0, int16x4_t __p1) { 25987 uint16x4_t __ret; 25988 __ret = (uint16x4_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 25989 return __ret; 25990 } 25991 #else 25992 __ai __attribute__((target("neon"))) uint16x4_t vrshl_u16(uint16x4_t __p0, int16x4_t __p1) { 25993 uint16x4_t __ret; 25994 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 25995 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 25996 __ret = (uint16x4_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 25997 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 25998 return __ret; 25999 } 26000 #endif 26001 26002 #ifdef __LITTLE_ENDIAN__ 26003 __ai __attribute__((target("neon"))) int8x8_t vrshl_s8(int8x8_t __p0, int8x8_t __p1) { 26004 int8x8_t __ret; 26005 __ret = (int8x8_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 26006 return __ret; 26007 } 26008 #else 26009 __ai __attribute__((target("neon"))) int8x8_t vrshl_s8(int8x8_t __p0, int8x8_t __p1) { 26010 int8x8_t __ret; 26011 int8x8_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 26012 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 26013 __ret = (int8x8_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 26014 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 26015 return __ret; 26016 } 26017 #endif 26018 26019 #ifdef __LITTLE_ENDIAN__ 26020 __ai __attribute__((target("neon"))) int32x2_t vrshl_s32(int32x2_t __p0, int32x2_t __p1) { 26021 int32x2_t __ret; 26022 __ret = (int32x2_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 26023 return __ret; 26024 } 26025 #else 26026 __ai __attribute__((target("neon"))) int32x2_t vrshl_s32(int32x2_t __p0, int32x2_t __p1) { 26027 int32x2_t __ret; 26028 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 26029 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 26030 __ret = (int32x2_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 26031 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 26032 return __ret; 26033 } 26034 #endif 26035 26036 __ai __attribute__((target("neon"))) int64x1_t vrshl_s64(int64x1_t __p0, int64x1_t __p1) { 26037 int64x1_t __ret; 26038 __ret = (int64x1_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 3); 26039 return __ret; 26040 } 26041 #ifdef __LITTLE_ENDIAN__ 26042 __ai __attribute__((target("neon"))) int16x4_t vrshl_s16(int16x4_t __p0, int16x4_t __p1) { 26043 int16x4_t __ret; 26044 __ret = (int16x4_t) __builtin_neon_vrshl_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 26045 return __ret; 26046 } 26047 #else 26048 __ai __attribute__((target("neon"))) int16x4_t vrshl_s16(int16x4_t __p0, int16x4_t __p1) { 26049 int16x4_t __ret; 26050 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 26051 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 26052 __ret = (int16x4_t) __builtin_neon_vrshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 26053 
__ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 26054 return __ret; 26055 } 26056 #endif 26057 26058 #ifdef __LITTLE_ENDIAN__ 26059 #define vrshrq_n_u8(__p0, __p1) __extension__ ({ \ 26060 uint8x16_t __ret; \ 26061 uint8x16_t __s0 = __p0; \ 26062 __ret = (uint8x16_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 48); \ 26063 __ret; \ 26064 }) 26065 #else 26066 #define vrshrq_n_u8(__p0, __p1) __extension__ ({ \ 26067 uint8x16_t __ret; \ 26068 uint8x16_t __s0 = __p0; \ 26069 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26070 __ret = (uint8x16_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 48); \ 26071 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26072 __ret; \ 26073 }) 26074 #endif 26075 26076 #ifdef __LITTLE_ENDIAN__ 26077 #define vrshrq_n_u32(__p0, __p1) __extension__ ({ \ 26078 uint32x4_t __ret; \ 26079 uint32x4_t __s0 = __p0; \ 26080 __ret = (uint32x4_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 50); \ 26081 __ret; \ 26082 }) 26083 #else 26084 #define vrshrq_n_u32(__p0, __p1) __extension__ ({ \ 26085 uint32x4_t __ret; \ 26086 uint32x4_t __s0 = __p0; \ 26087 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26088 __ret = (uint32x4_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 50); \ 26089 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26090 __ret; \ 26091 }) 26092 #endif 26093 26094 #ifdef __LITTLE_ENDIAN__ 26095 #define vrshrq_n_u64(__p0, __p1) __extension__ ({ \ 26096 uint64x2_t __ret; \ 26097 uint64x2_t __s0 = __p0; \ 26098 __ret = (uint64x2_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 51); \ 26099 __ret; \ 26100 }) 26101 #else 26102 #define vrshrq_n_u64(__p0, __p1) __extension__ ({ \ 26103 uint64x2_t __ret; \ 26104 uint64x2_t __s0 = __p0; \ 26105 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26106 __ret = (uint64x2_t) 
__builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 51); \ 26107 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26108 __ret; \ 26109 }) 26110 #endif 26111 26112 #ifdef __LITTLE_ENDIAN__ 26113 #define vrshrq_n_u16(__p0, __p1) __extension__ ({ \ 26114 uint16x8_t __ret; \ 26115 uint16x8_t __s0 = __p0; \ 26116 __ret = (uint16x8_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 49); \ 26117 __ret; \ 26118 }) 26119 #else 26120 #define vrshrq_n_u16(__p0, __p1) __extension__ ({ \ 26121 uint16x8_t __ret; \ 26122 uint16x8_t __s0 = __p0; \ 26123 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26124 __ret = (uint16x8_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 49); \ 26125 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26126 __ret; \ 26127 }) 26128 #endif 26129 26130 #ifdef __LITTLE_ENDIAN__ 26131 #define vrshrq_n_s8(__p0, __p1) __extension__ ({ \ 26132 int8x16_t __ret; \ 26133 int8x16_t __s0 = __p0; \ 26134 __ret = (int8x16_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 32); \ 26135 __ret; \ 26136 }) 26137 #else 26138 #define vrshrq_n_s8(__p0, __p1) __extension__ ({ \ 26139 int8x16_t __ret; \ 26140 int8x16_t __s0 = __p0; \ 26141 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26142 __ret = (int8x16_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 32); \ 26143 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26144 __ret; \ 26145 }) 26146 #endif 26147 26148 #ifdef __LITTLE_ENDIAN__ 26149 #define vrshrq_n_s32(__p0, __p1) __extension__ ({ \ 26150 int32x4_t __ret; \ 26151 int32x4_t __s0 = __p0; \ 26152 __ret = (int32x4_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 34); \ 26153 __ret; \ 26154 }) 26155 #else 26156 #define vrshrq_n_s32(__p0, __p1) __extension__ ({ \ 26157 int32x4_t __ret; \ 26158 int32x4_t __s0 = __p0; \ 26159 int32x4_t __rev0; __rev0 = 
__builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26160 __ret = (int32x4_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 34); \ 26161 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26162 __ret; \ 26163 }) 26164 #endif 26165 26166 #ifdef __LITTLE_ENDIAN__ 26167 #define vrshrq_n_s64(__p0, __p1) __extension__ ({ \ 26168 int64x2_t __ret; \ 26169 int64x2_t __s0 = __p0; \ 26170 __ret = (int64x2_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 35); \ 26171 __ret; \ 26172 }) 26173 #else 26174 #define vrshrq_n_s64(__p0, __p1) __extension__ ({ \ 26175 int64x2_t __ret; \ 26176 int64x2_t __s0 = __p0; \ 26177 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26178 __ret = (int64x2_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 35); \ 26179 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26180 __ret; \ 26181 }) 26182 #endif 26183 26184 #ifdef __LITTLE_ENDIAN__ 26185 #define vrshrq_n_s16(__p0, __p1) __extension__ ({ \ 26186 int16x8_t __ret; \ 26187 int16x8_t __s0 = __p0; \ 26188 __ret = (int16x8_t) __builtin_neon_vrshrq_n_v((int8x16_t)__s0, __p1, 33); \ 26189 __ret; \ 26190 }) 26191 #else 26192 #define vrshrq_n_s16(__p0, __p1) __extension__ ({ \ 26193 int16x8_t __ret; \ 26194 int16x8_t __s0 = __p0; \ 26195 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26196 __ret = (int16x8_t) __builtin_neon_vrshrq_n_v((int8x16_t)__rev0, __p1, 33); \ 26197 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26198 __ret; \ 26199 }) 26200 #endif 26201 26202 #ifdef __LITTLE_ENDIAN__ 26203 #define vrshr_n_u8(__p0, __p1) __extension__ ({ \ 26204 uint8x8_t __ret; \ 26205 uint8x8_t __s0 = __p0; \ 26206 __ret = (uint8x8_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 16); \ 26207 __ret; \ 26208 }) 26209 #else 26210 #define vrshr_n_u8(__p0, __p1) __extension__ ({ \ 26211 uint8x8_t __ret; \ 26212 uint8x8_t __s0 = __p0; \ 26213 uint8x8_t __rev0; __rev0 = 
__builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26214 __ret = (uint8x8_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 16); \ 26215 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26216 __ret; \ 26217 }) 26218 #endif 26219 26220 #ifdef __LITTLE_ENDIAN__ 26221 #define vrshr_n_u32(__p0, __p1) __extension__ ({ \ 26222 uint32x2_t __ret; \ 26223 uint32x2_t __s0 = __p0; \ 26224 __ret = (uint32x2_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 18); \ 26225 __ret; \ 26226 }) 26227 #else 26228 #define vrshr_n_u32(__p0, __p1) __extension__ ({ \ 26229 uint32x2_t __ret; \ 26230 uint32x2_t __s0 = __p0; \ 26231 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26232 __ret = (uint32x2_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 18); \ 26233 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26234 __ret; \ 26235 }) 26236 #endif 26237 26238 #define vrshr_n_u64(__p0, __p1) __extension__ ({ \ 26239 uint64x1_t __ret; \ 26240 uint64x1_t __s0 = __p0; \ 26241 __ret = (uint64x1_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 19); \ 26242 __ret; \ 26243 }) 26244 #ifdef __LITTLE_ENDIAN__ 26245 #define vrshr_n_u16(__p0, __p1) __extension__ ({ \ 26246 uint16x4_t __ret; \ 26247 uint16x4_t __s0 = __p0; \ 26248 __ret = (uint16x4_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 17); \ 26249 __ret; \ 26250 }) 26251 #else 26252 #define vrshr_n_u16(__p0, __p1) __extension__ ({ \ 26253 uint16x4_t __ret; \ 26254 uint16x4_t __s0 = __p0; \ 26255 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26256 __ret = (uint16x4_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 17); \ 26257 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26258 __ret; \ 26259 }) 26260 #endif 26261 26262 #ifdef __LITTLE_ENDIAN__ 26263 #define vrshr_n_s8(__p0, __p1) __extension__ ({ \ 26264 int8x8_t __ret; \ 26265 int8x8_t __s0 = __p0; \ 26266 __ret = (int8x8_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 
0); \ 26267 __ret; \ 26268 }) 26269 #else 26270 #define vrshr_n_s8(__p0, __p1) __extension__ ({ \ 26271 int8x8_t __ret; \ 26272 int8x8_t __s0 = __p0; \ 26273 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26274 __ret = (int8x8_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 0); \ 26275 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26276 __ret; \ 26277 }) 26278 #endif 26279 26280 #ifdef __LITTLE_ENDIAN__ 26281 #define vrshr_n_s32(__p0, __p1) __extension__ ({ \ 26282 int32x2_t __ret; \ 26283 int32x2_t __s0 = __p0; \ 26284 __ret = (int32x2_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 2); \ 26285 __ret; \ 26286 }) 26287 #else 26288 #define vrshr_n_s32(__p0, __p1) __extension__ ({ \ 26289 int32x2_t __ret; \ 26290 int32x2_t __s0 = __p0; \ 26291 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26292 __ret = (int32x2_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 2); \ 26293 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26294 __ret; \ 26295 }) 26296 #endif 26297 26298 #define vrshr_n_s64(__p0, __p1) __extension__ ({ \ 26299 int64x1_t __ret; \ 26300 int64x1_t __s0 = __p0; \ 26301 __ret = (int64x1_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 3); \ 26302 __ret; \ 26303 }) 26304 #ifdef __LITTLE_ENDIAN__ 26305 #define vrshr_n_s16(__p0, __p1) __extension__ ({ \ 26306 int16x4_t __ret; \ 26307 int16x4_t __s0 = __p0; \ 26308 __ret = (int16x4_t) __builtin_neon_vrshr_n_v((int8x8_t)__s0, __p1, 1); \ 26309 __ret; \ 26310 }) 26311 #else 26312 #define vrshr_n_s16(__p0, __p1) __extension__ ({ \ 26313 int16x4_t __ret; \ 26314 int16x4_t __s0 = __p0; \ 26315 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26316 __ret = (int16x4_t) __builtin_neon_vrshr_n_v((int8x8_t)__rev0, __p1, 1); \ 26317 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26318 __ret; \ 26319 }) 26320 #endif 26321 26322 #ifdef __LITTLE_ENDIAN__ 26323 #define 
vrshrn_n_u32(__p0, __p1) __extension__ ({ \ 26324 uint16x4_t __ret; \ 26325 uint32x4_t __s0 = __p0; \ 26326 __ret = (uint16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 17); \ 26327 __ret; \ 26328 }) 26329 #else 26330 #define vrshrn_n_u32(__p0, __p1) __extension__ ({ \ 26331 uint16x4_t __ret; \ 26332 uint32x4_t __s0 = __p0; \ 26333 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26334 __ret = (uint16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 17); \ 26335 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26336 __ret; \ 26337 }) 26338 #define __noswap_vrshrn_n_u32(__p0, __p1) __extension__ ({ \ 26339 uint16x4_t __ret; \ 26340 uint32x4_t __s0 = __p0; \ 26341 __ret = (uint16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 17); \ 26342 __ret; \ 26343 }) 26344 #endif 26345 26346 #ifdef __LITTLE_ENDIAN__ 26347 #define vrshrn_n_u64(__p0, __p1) __extension__ ({ \ 26348 uint32x2_t __ret; \ 26349 uint64x2_t __s0 = __p0; \ 26350 __ret = (uint32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 18); \ 26351 __ret; \ 26352 }) 26353 #else 26354 #define vrshrn_n_u64(__p0, __p1) __extension__ ({ \ 26355 uint32x2_t __ret; \ 26356 uint64x2_t __s0 = __p0; \ 26357 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26358 __ret = (uint32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 18); \ 26359 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26360 __ret; \ 26361 }) 26362 #define __noswap_vrshrn_n_u64(__p0, __p1) __extension__ ({ \ 26363 uint32x2_t __ret; \ 26364 uint64x2_t __s0 = __p0; \ 26365 __ret = (uint32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 18); \ 26366 __ret; \ 26367 }) 26368 #endif 26369 26370 #ifdef __LITTLE_ENDIAN__ 26371 #define vrshrn_n_u16(__p0, __p1) __extension__ ({ \ 26372 uint8x8_t __ret; \ 26373 uint16x8_t __s0 = __p0; \ 26374 __ret = (uint8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 16); \ 26375 __ret; \ 26376 }) 26377 #else 
26378 #define vrshrn_n_u16(__p0, __p1) __extension__ ({ \ 26379 uint8x8_t __ret; \ 26380 uint16x8_t __s0 = __p0; \ 26381 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26382 __ret = (uint8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 16); \ 26383 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26384 __ret; \ 26385 }) 26386 #define __noswap_vrshrn_n_u16(__p0, __p1) __extension__ ({ \ 26387 uint8x8_t __ret; \ 26388 uint16x8_t __s0 = __p0; \ 26389 __ret = (uint8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 16); \ 26390 __ret; \ 26391 }) 26392 #endif 26393 26394 #ifdef __LITTLE_ENDIAN__ 26395 #define vrshrn_n_s32(__p0, __p1) __extension__ ({ \ 26396 int16x4_t __ret; \ 26397 int32x4_t __s0 = __p0; \ 26398 __ret = (int16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 1); \ 26399 __ret; \ 26400 }) 26401 #else 26402 #define vrshrn_n_s32(__p0, __p1) __extension__ ({ \ 26403 int16x4_t __ret; \ 26404 int32x4_t __s0 = __p0; \ 26405 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26406 __ret = (int16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 1); \ 26407 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26408 __ret; \ 26409 }) 26410 #define __noswap_vrshrn_n_s32(__p0, __p1) __extension__ ({ \ 26411 int16x4_t __ret; \ 26412 int32x4_t __s0 = __p0; \ 26413 __ret = (int16x4_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 1); \ 26414 __ret; \ 26415 }) 26416 #endif 26417 26418 #ifdef __LITTLE_ENDIAN__ 26419 #define vrshrn_n_s64(__p0, __p1) __extension__ ({ \ 26420 int32x2_t __ret; \ 26421 int64x2_t __s0 = __p0; \ 26422 __ret = (int32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 2); \ 26423 __ret; \ 26424 }) 26425 #else 26426 #define vrshrn_n_s64(__p0, __p1) __extension__ ({ \ 26427 int32x2_t __ret; \ 26428 int64x2_t __s0 = __p0; \ 26429 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26430 __ret = 
(int32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 2); \ 26431 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26432 __ret; \ 26433 }) 26434 #define __noswap_vrshrn_n_s64(__p0, __p1) __extension__ ({ \ 26435 int32x2_t __ret; \ 26436 int64x2_t __s0 = __p0; \ 26437 __ret = (int32x2_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 2); \ 26438 __ret; \ 26439 }) 26440 #endif 26441 26442 #ifdef __LITTLE_ENDIAN__ 26443 #define vrshrn_n_s16(__p0, __p1) __extension__ ({ \ 26444 int8x8_t __ret; \ 26445 int16x8_t __s0 = __p0; \ 26446 __ret = (int8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 0); \ 26447 __ret; \ 26448 }) 26449 #else 26450 #define vrshrn_n_s16(__p0, __p1) __extension__ ({ \ 26451 int8x8_t __ret; \ 26452 int16x8_t __s0 = __p0; \ 26453 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26454 __ret = (int8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__rev0, __p1, 0); \ 26455 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26456 __ret; \ 26457 }) 26458 #define __noswap_vrshrn_n_s16(__p0, __p1) __extension__ ({ \ 26459 int8x8_t __ret; \ 26460 int16x8_t __s0 = __p0; \ 26461 __ret = (int8x8_t) __builtin_neon_vrshrn_n_v((int8x16_t)__s0, __p1, 0); \ 26462 __ret; \ 26463 }) 26464 #endif 26465 26466 #ifdef __LITTLE_ENDIAN__ 26467 __ai __attribute__((target("neon"))) uint32x4_t vrsqrteq_u32(uint32x4_t __p0) { 26468 uint32x4_t __ret; 26469 __ret = (uint32x4_t) __builtin_neon_vrsqrteq_v((int8x16_t)__p0, 50); 26470 return __ret; 26471 } 26472 #else 26473 __ai __attribute__((target("neon"))) uint32x4_t vrsqrteq_u32(uint32x4_t __p0) { 26474 uint32x4_t __ret; 26475 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 26476 __ret = (uint32x4_t) __builtin_neon_vrsqrteq_v((int8x16_t)__rev0, 50); 26477 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 26478 return __ret; 26479 } 26480 #endif 26481 26482 #ifdef __LITTLE_ENDIAN__ 26483 __ai 
__attribute__((target("neon"))) float32x4_t vrsqrteq_f32(float32x4_t __p0) { 26484 float32x4_t __ret; 26485 __ret = (float32x4_t) __builtin_neon_vrsqrteq_v((int8x16_t)__p0, 41); 26486 return __ret; 26487 } 26488 #else 26489 __ai __attribute__((target("neon"))) float32x4_t vrsqrteq_f32(float32x4_t __p0) { 26490 float32x4_t __ret; 26491 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 26492 __ret = (float32x4_t) __builtin_neon_vrsqrteq_v((int8x16_t)__rev0, 41); 26493 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 26494 return __ret; 26495 } 26496 #endif 26497 26498 #ifdef __LITTLE_ENDIAN__ 26499 __ai __attribute__((target("neon"))) uint32x2_t vrsqrte_u32(uint32x2_t __p0) { 26500 uint32x2_t __ret; 26501 __ret = (uint32x2_t) __builtin_neon_vrsqrte_v((int8x8_t)__p0, 18); 26502 return __ret; 26503 } 26504 #else 26505 __ai __attribute__((target("neon"))) uint32x2_t vrsqrte_u32(uint32x2_t __p0) { 26506 uint32x2_t __ret; 26507 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 26508 __ret = (uint32x2_t) __builtin_neon_vrsqrte_v((int8x8_t)__rev0, 18); 26509 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 26510 return __ret; 26511 } 26512 #endif 26513 26514 #ifdef __LITTLE_ENDIAN__ 26515 __ai __attribute__((target("neon"))) float32x2_t vrsqrte_f32(float32x2_t __p0) { 26516 float32x2_t __ret; 26517 __ret = (float32x2_t) __builtin_neon_vrsqrte_v((int8x8_t)__p0, 9); 26518 return __ret; 26519 } 26520 #else 26521 __ai __attribute__((target("neon"))) float32x2_t vrsqrte_f32(float32x2_t __p0) { 26522 float32x2_t __ret; 26523 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 26524 __ret = (float32x2_t) __builtin_neon_vrsqrte_v((int8x8_t)__rev0, 9); 26525 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 26526 return __ret; 26527 } 26528 #endif 26529 26530 #ifdef __LITTLE_ENDIAN__ 26531 __ai __attribute__((target("neon"))) float32x4_t vrsqrtsq_f32(float32x4_t __p0, float32x4_t __p1) { 26532 
float32x4_t __ret; 26533 __ret = (float32x4_t) __builtin_neon_vrsqrtsq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 26534 return __ret; 26535 } 26536 #else 26537 __ai __attribute__((target("neon"))) float32x4_t vrsqrtsq_f32(float32x4_t __p0, float32x4_t __p1) { 26538 float32x4_t __ret; 26539 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 26540 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 26541 __ret = (float32x4_t) __builtin_neon_vrsqrtsq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 26542 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 26543 return __ret; 26544 } 26545 #endif 26546 26547 #ifdef __LITTLE_ENDIAN__ 26548 __ai __attribute__((target("neon"))) float32x2_t vrsqrts_f32(float32x2_t __p0, float32x2_t __p1) { 26549 float32x2_t __ret; 26550 __ret = (float32x2_t) __builtin_neon_vrsqrts_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 26551 return __ret; 26552 } 26553 #else 26554 __ai __attribute__((target("neon"))) float32x2_t vrsqrts_f32(float32x2_t __p0, float32x2_t __p1) { 26555 float32x2_t __ret; 26556 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 26557 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 26558 __ret = (float32x2_t) __builtin_neon_vrsqrts_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 26559 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 26560 return __ret; 26561 } 26562 #endif 26563 26564 #ifdef __LITTLE_ENDIAN__ 26565 #define vrsraq_n_u8(__p0, __p1, __p2) __extension__ ({ \ 26566 uint8x16_t __ret; \ 26567 uint8x16_t __s0 = __p0; \ 26568 uint8x16_t __s1 = __p1; \ 26569 __ret = (uint8x16_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \ 26570 __ret; \ 26571 }) 26572 #else 26573 #define vrsraq_n_u8(__p0, __p1, __p2) __extension__ ({ \ 26574 uint8x16_t __ret; \ 26575 uint8x16_t __s0 = __p0; \ 26576 uint8x16_t __s1 = __p1; \ 26577 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 
10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26578 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26579 __ret = (uint8x16_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \ 26580 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26581 __ret; \ 26582 }) 26583 #endif 26584 26585 #ifdef __LITTLE_ENDIAN__ 26586 #define vrsraq_n_u32(__p0, __p1, __p2) __extension__ ({ \ 26587 uint32x4_t __ret; \ 26588 uint32x4_t __s0 = __p0; \ 26589 uint32x4_t __s1 = __p1; \ 26590 __ret = (uint32x4_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \ 26591 __ret; \ 26592 }) 26593 #else 26594 #define vrsraq_n_u32(__p0, __p1, __p2) __extension__ ({ \ 26595 uint32x4_t __ret; \ 26596 uint32x4_t __s0 = __p0; \ 26597 uint32x4_t __s1 = __p1; \ 26598 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26599 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 26600 __ret = (uint32x4_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \ 26601 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26602 __ret; \ 26603 }) 26604 #endif 26605 26606 #ifdef __LITTLE_ENDIAN__ 26607 #define vrsraq_n_u64(__p0, __p1, __p2) __extension__ ({ \ 26608 uint64x2_t __ret; \ 26609 uint64x2_t __s0 = __p0; \ 26610 uint64x2_t __s1 = __p1; \ 26611 __ret = (uint64x2_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \ 26612 __ret; \ 26613 }) 26614 #else 26615 #define vrsraq_n_u64(__p0, __p1, __p2) __extension__ ({ \ 26616 uint64x2_t __ret; \ 26617 uint64x2_t __s0 = __p0; \ 26618 uint64x2_t __s1 = __p1; \ 26619 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26620 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 26621 __ret = (uint64x2_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, 
(int8x16_t)__rev1, __p2, 51); \ 26622 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26623 __ret; \ 26624 }) 26625 #endif 26626 26627 #ifdef __LITTLE_ENDIAN__ 26628 #define vrsraq_n_u16(__p0, __p1, __p2) __extension__ ({ \ 26629 uint16x8_t __ret; \ 26630 uint16x8_t __s0 = __p0; \ 26631 uint16x8_t __s1 = __p1; \ 26632 __ret = (uint16x8_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \ 26633 __ret; \ 26634 }) 26635 #else 26636 #define vrsraq_n_u16(__p0, __p1, __p2) __extension__ ({ \ 26637 uint16x8_t __ret; \ 26638 uint16x8_t __s0 = __p0; \ 26639 uint16x8_t __s1 = __p1; \ 26640 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26641 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 26642 __ret = (uint16x8_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \ 26643 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26644 __ret; \ 26645 }) 26646 #endif 26647 26648 #ifdef __LITTLE_ENDIAN__ 26649 #define vrsraq_n_s8(__p0, __p1, __p2) __extension__ ({ \ 26650 int8x16_t __ret; \ 26651 int8x16_t __s0 = __p0; \ 26652 int8x16_t __s1 = __p1; \ 26653 __ret = (int8x16_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \ 26654 __ret; \ 26655 }) 26656 #else 26657 #define vrsraq_n_s8(__p0, __p1, __p2) __extension__ ({ \ 26658 int8x16_t __ret; \ 26659 int8x16_t __s0 = __p0; \ 26660 int8x16_t __s1 = __p1; \ 26661 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26662 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26663 __ret = (int8x16_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \ 26664 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 26665 __ret; \ 26666 }) 26667 #endif 
26668 26669 #ifdef __LITTLE_ENDIAN__ 26670 #define vrsraq_n_s32(__p0, __p1, __p2) __extension__ ({ \ 26671 int32x4_t __ret; \ 26672 int32x4_t __s0 = __p0; \ 26673 int32x4_t __s1 = __p1; \ 26674 __ret = (int32x4_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \ 26675 __ret; \ 26676 }) 26677 #else 26678 #define vrsraq_n_s32(__p0, __p1, __p2) __extension__ ({ \ 26679 int32x4_t __ret; \ 26680 int32x4_t __s0 = __p0; \ 26681 int32x4_t __s1 = __p1; \ 26682 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26683 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 26684 __ret = (int32x4_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \ 26685 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26686 __ret; \ 26687 }) 26688 #endif 26689 26690 #ifdef __LITTLE_ENDIAN__ 26691 #define vrsraq_n_s64(__p0, __p1, __p2) __extension__ ({ \ 26692 int64x2_t __ret; \ 26693 int64x2_t __s0 = __p0; \ 26694 int64x2_t __s1 = __p1; \ 26695 __ret = (int64x2_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \ 26696 __ret; \ 26697 }) 26698 #else 26699 #define vrsraq_n_s64(__p0, __p1, __p2) __extension__ ({ \ 26700 int64x2_t __ret; \ 26701 int64x2_t __s0 = __p0; \ 26702 int64x2_t __s1 = __p1; \ 26703 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26704 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 26705 __ret = (int64x2_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \ 26706 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26707 __ret; \ 26708 }) 26709 #endif 26710 26711 #ifdef __LITTLE_ENDIAN__ 26712 #define vrsraq_n_s16(__p0, __p1, __p2) __extension__ ({ \ 26713 int16x8_t __ret; \ 26714 int16x8_t __s0 = __p0; \ 26715 int16x8_t __s1 = __p1; \ 26716 __ret = (int16x8_t) __builtin_neon_vrsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \ 26717 __ret; \ 26718 }) 26719 
#else 26720 #define vrsraq_n_s16(__p0, __p1, __p2) __extension__ ({ \ 26721 int16x8_t __ret; \ 26722 int16x8_t __s0 = __p0; \ 26723 int16x8_t __s1 = __p1; \ 26724 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26725 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 26726 __ret = (int16x8_t) __builtin_neon_vrsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 26727 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26728 __ret; \ 26729 }) 26730 #endif 26731 26732 #ifdef __LITTLE_ENDIAN__ 26733 #define vrsra_n_u8(__p0, __p1, __p2) __extension__ ({ \ 26734 uint8x8_t __ret; \ 26735 uint8x8_t __s0 = __p0; \ 26736 uint8x8_t __s1 = __p1; \ 26737 __ret = (uint8x8_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 16); \ 26738 __ret; \ 26739 }) 26740 #else 26741 #define vrsra_n_u8(__p0, __p1, __p2) __extension__ ({ \ 26742 uint8x8_t __ret; \ 26743 uint8x8_t __s0 = __p0; \ 26744 uint8x8_t __s1 = __p1; \ 26745 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26746 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 26747 __ret = (uint8x8_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \ 26748 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26749 __ret; \ 26750 }) 26751 #endif 26752 26753 #ifdef __LITTLE_ENDIAN__ 26754 #define vrsra_n_u32(__p0, __p1, __p2) __extension__ ({ \ 26755 uint32x2_t __ret; \ 26756 uint32x2_t __s0 = __p0; \ 26757 uint32x2_t __s1 = __p1; \ 26758 __ret = (uint32x2_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \ 26759 __ret; \ 26760 }) 26761 #else 26762 #define vrsra_n_u32(__p0, __p1, __p2) __extension__ ({ \ 26763 uint32x2_t __ret; \ 26764 uint32x2_t __s0 = __p0; \ 26765 uint32x2_t __s1 = __p1; \ 26766 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 
26767 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 26768 __ret = (uint32x2_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \ 26769 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26770 __ret; \ 26771 }) 26772 #endif 26773 26774 #define vrsra_n_u64(__p0, __p1, __p2) __extension__ ({ \ 26775 uint64x1_t __ret; \ 26776 uint64x1_t __s0 = __p0; \ 26777 uint64x1_t __s1 = __p1; \ 26778 __ret = (uint64x1_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \ 26779 __ret; \ 26780 }) 26781 #ifdef __LITTLE_ENDIAN__ 26782 #define vrsra_n_u16(__p0, __p1, __p2) __extension__ ({ \ 26783 uint16x4_t __ret; \ 26784 uint16x4_t __s0 = __p0; \ 26785 uint16x4_t __s1 = __p1; \ 26786 __ret = (uint16x4_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \ 26787 __ret; \ 26788 }) 26789 #else 26790 #define vrsra_n_u16(__p0, __p1, __p2) __extension__ ({ \ 26791 uint16x4_t __ret; \ 26792 uint16x4_t __s0 = __p0; \ 26793 uint16x4_t __s1 = __p1; \ 26794 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26795 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 26796 __ret = (uint16x4_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \ 26797 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26798 __ret; \ 26799 }) 26800 #endif 26801 26802 #ifdef __LITTLE_ENDIAN__ 26803 #define vrsra_n_s8(__p0, __p1, __p2) __extension__ ({ \ 26804 int8x8_t __ret; \ 26805 int8x8_t __s0 = __p0; \ 26806 int8x8_t __s1 = __p1; \ 26807 __ret = (int8x8_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \ 26808 __ret; \ 26809 }) 26810 #else 26811 #define vrsra_n_s8(__p0, __p1, __p2) __extension__ ({ \ 26812 int8x8_t __ret; \ 26813 int8x8_t __s0 = __p0; \ 26814 int8x8_t __s1 = __p1; \ 26815 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 26816 int8x8_t __rev1; __rev1 = 
__builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 26817 __ret = (int8x8_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \ 26818 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 26819 __ret; \ 26820 }) 26821 #endif 26822 26823 #ifdef __LITTLE_ENDIAN__ 26824 #define vrsra_n_s32(__p0, __p1, __p2) __extension__ ({ \ 26825 int32x2_t __ret; \ 26826 int32x2_t __s0 = __p0; \ 26827 int32x2_t __s1 = __p1; \ 26828 __ret = (int32x2_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \ 26829 __ret; \ 26830 }) 26831 #else 26832 #define vrsra_n_s32(__p0, __p1, __p2) __extension__ ({ \ 26833 int32x2_t __ret; \ 26834 int32x2_t __s0 = __p0; \ 26835 int32x2_t __s1 = __p1; \ 26836 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 26837 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 26838 __ret = (int32x2_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 26839 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 26840 __ret; \ 26841 }) 26842 #endif 26843 26844 #define vrsra_n_s64(__p0, __p1, __p2) __extension__ ({ \ 26845 int64x1_t __ret; \ 26846 int64x1_t __s0 = __p0; \ 26847 int64x1_t __s1 = __p1; \ 26848 __ret = (int64x1_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \ 26849 __ret; \ 26850 }) 26851 #ifdef __LITTLE_ENDIAN__ 26852 #define vrsra_n_s16(__p0, __p1, __p2) __extension__ ({ \ 26853 int16x4_t __ret; \ 26854 int16x4_t __s0 = __p0; \ 26855 int16x4_t __s1 = __p1; \ 26856 __ret = (int16x4_t) __builtin_neon_vrsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \ 26857 __ret; \ 26858 }) 26859 #else 26860 #define vrsra_n_s16(__p0, __p1, __p2) __extension__ ({ \ 26861 int16x4_t __ret; \ 26862 int16x4_t __s0 = __p0; \ 26863 int16x4_t __s1 = __p1; \ 26864 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 26865 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 
0); \ 26866 __ret = (int16x4_t) __builtin_neon_vrsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 26867 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 26868 __ret; \ 26869 }) 26870 #endif 26871 26872 #ifdef __LITTLE_ENDIAN__ 26873 __ai __attribute__((target("neon"))) uint16x4_t vrsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 26874 uint16x4_t __ret; 26875 __ret = (uint16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17); 26876 return __ret; 26877 } 26878 #else 26879 __ai __attribute__((target("neon"))) uint16x4_t vrsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 26880 uint16x4_t __ret; 26881 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 26882 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 26883 __ret = (uint16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 17); 26884 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 26885 return __ret; 26886 } 26887 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vrsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 26888 uint16x4_t __ret; 26889 __ret = (uint16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17); 26890 return __ret; 26891 } 26892 #endif 26893 26894 #ifdef __LITTLE_ENDIAN__ 26895 __ai __attribute__((target("neon"))) uint32x2_t vrsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 26896 uint32x2_t __ret; 26897 __ret = (uint32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18); 26898 return __ret; 26899 } 26900 #else 26901 __ai __attribute__((target("neon"))) uint32x2_t vrsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 26902 uint32x2_t __ret; 26903 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 26904 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 26905 __ret = (uint32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 18); 26906 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 26907 return __ret; 
26908 } 26909 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vrsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 26910 uint32x2_t __ret; 26911 __ret = (uint32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18); 26912 return __ret; 26913 } 26914 #endif 26915 26916 #ifdef __LITTLE_ENDIAN__ 26917 __ai __attribute__((target("neon"))) uint8x8_t vrsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 26918 uint8x8_t __ret; 26919 __ret = (uint8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16); 26920 return __ret; 26921 } 26922 #else 26923 __ai __attribute__((target("neon"))) uint8x8_t vrsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 26924 uint8x8_t __ret; 26925 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 26926 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 26927 __ret = (uint8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 16); 26928 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 26929 return __ret; 26930 } 26931 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vrsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 26932 uint8x8_t __ret; 26933 __ret = (uint8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16); 26934 return __ret; 26935 } 26936 #endif 26937 26938 #ifdef __LITTLE_ENDIAN__ 26939 __ai __attribute__((target("neon"))) int16x4_t vrsubhn_s32(int32x4_t __p0, int32x4_t __p1) { 26940 int16x4_t __ret; 26941 __ret = (int16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1); 26942 return __ret; 26943 } 26944 #else 26945 __ai __attribute__((target("neon"))) int16x4_t vrsubhn_s32(int32x4_t __p0, int32x4_t __p1) { 26946 int16x4_t __ret; 26947 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 26948 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 26949 __ret = (int16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, 
(int8x16_t)__rev1, 1); 26950 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 26951 return __ret; 26952 } 26953 __ai __attribute__((target("neon"))) int16x4_t __noswap_vrsubhn_s32(int32x4_t __p0, int32x4_t __p1) { 26954 int16x4_t __ret; 26955 __ret = (int16x4_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1); 26956 return __ret; 26957 } 26958 #endif 26959 26960 #ifdef __LITTLE_ENDIAN__ 26961 __ai __attribute__((target("neon"))) int32x2_t vrsubhn_s64(int64x2_t __p0, int64x2_t __p1) { 26962 int32x2_t __ret; 26963 __ret = (int32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2); 26964 return __ret; 26965 } 26966 #else 26967 __ai __attribute__((target("neon"))) int32x2_t vrsubhn_s64(int64x2_t __p0, int64x2_t __p1) { 26968 int32x2_t __ret; 26969 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 26970 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 26971 __ret = (int32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 2); 26972 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 26973 return __ret; 26974 } 26975 __ai __attribute__((target("neon"))) int32x2_t __noswap_vrsubhn_s64(int64x2_t __p0, int64x2_t __p1) { 26976 int32x2_t __ret; 26977 __ret = (int32x2_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2); 26978 return __ret; 26979 } 26980 #endif 26981 26982 #ifdef __LITTLE_ENDIAN__ 26983 __ai __attribute__((target("neon"))) int8x8_t vrsubhn_s16(int16x8_t __p0, int16x8_t __p1) { 26984 int8x8_t __ret; 26985 __ret = (int8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0); 26986 return __ret; 26987 } 26988 #else 26989 __ai __attribute__((target("neon"))) int8x8_t vrsubhn_s16(int16x8_t __p0, int16x8_t __p1) { 26990 int8x8_t __ret; 26991 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 26992 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 26993 __ret = (int8x8_t) 
__builtin_neon_vrsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 0); 26994 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 26995 return __ret; 26996 } 26997 __ai __attribute__((target("neon"))) int8x8_t __noswap_vrsubhn_s16(int16x8_t __p0, int16x8_t __p1) { 26998 int8x8_t __ret; 26999 __ret = (int8x8_t) __builtin_neon_vrsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0); 27000 return __ret; 27001 } 27002 #endif 27003 27004 #ifdef __LITTLE_ENDIAN__ 27005 #define vset_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 27006 poly8x8_t __ret; \ 27007 poly8_t __s0 = __p0; \ 27008 poly8x8_t __s1 = __p1; \ 27009 __ret = (poly8x8_t) __builtin_neon_vset_lane_i8(__s0, (poly8x8_t)__s1, __p2); \ 27010 __ret; \ 27011 }) 27012 #else 27013 #define vset_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 27014 poly8x8_t __ret; \ 27015 poly8_t __s0 = __p0; \ 27016 poly8x8_t __s1 = __p1; \ 27017 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 27018 __ret = (poly8x8_t) __builtin_neon_vset_lane_i8(__s0, (poly8x8_t)__rev1, __p2); \ 27019 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 27020 __ret; \ 27021 }) 27022 #define __noswap_vset_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 27023 poly8x8_t __ret; \ 27024 poly8_t __s0 = __p0; \ 27025 poly8x8_t __s1 = __p1; \ 27026 __ret = (poly8x8_t) __builtin_neon_vset_lane_i8(__s0, (poly8x8_t)__s1, __p2); \ 27027 __ret; \ 27028 }) 27029 #endif 27030 27031 #ifdef __LITTLE_ENDIAN__ 27032 #define vset_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 27033 poly16x4_t __ret; \ 27034 poly16_t __s0 = __p0; \ 27035 poly16x4_t __s1 = __p1; \ 27036 __ret = (poly16x4_t) __builtin_neon_vset_lane_i16(__s0, (poly16x4_t)__s1, __p2); \ 27037 __ret; \ 27038 }) 27039 #else 27040 #define vset_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 27041 poly16x4_t __ret; \ 27042 poly16_t __s0 = __p0; \ 27043 poly16x4_t __s1 = __p1; \ 27044 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 
1, 0); \ 27045 __ret = (poly16x4_t) __builtin_neon_vset_lane_i16(__s0, (poly16x4_t)__rev1, __p2); \ 27046 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 27047 __ret; \ 27048 }) 27049 #define __noswap_vset_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 27050 poly16x4_t __ret; \ 27051 poly16_t __s0 = __p0; \ 27052 poly16x4_t __s1 = __p1; \ 27053 __ret = (poly16x4_t) __builtin_neon_vset_lane_i16(__s0, (poly16x4_t)__s1, __p2); \ 27054 __ret; \ 27055 }) 27056 #endif 27057 27058 #ifdef __LITTLE_ENDIAN__ 27059 #define vsetq_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 27060 poly8x16_t __ret; \ 27061 poly8_t __s0 = __p0; \ 27062 poly8x16_t __s1 = __p1; \ 27063 __ret = (poly8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (poly8x16_t)__s1, __p2); \ 27064 __ret; \ 27065 }) 27066 #else 27067 #define vsetq_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 27068 poly8x16_t __ret; \ 27069 poly8_t __s0 = __p0; \ 27070 poly8x16_t __s1 = __p1; \ 27071 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 27072 __ret = (poly8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (poly8x16_t)__rev1, __p2); \ 27073 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 27074 __ret; \ 27075 }) 27076 #define __noswap_vsetq_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 27077 poly8x16_t __ret; \ 27078 poly8_t __s0 = __p0; \ 27079 poly8x16_t __s1 = __p1; \ 27080 __ret = (poly8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (poly8x16_t)__s1, __p2); \ 27081 __ret; \ 27082 }) 27083 #endif 27084 27085 #ifdef __LITTLE_ENDIAN__ 27086 #define vsetq_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 27087 poly16x8_t __ret; \ 27088 poly16_t __s0 = __p0; \ 27089 poly16x8_t __s1 = __p1; \ 27090 __ret = (poly16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (poly16x8_t)__s1, __p2); \ 27091 __ret; \ 27092 }) 27093 #else 27094 #define vsetq_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 27095 poly16x8_t __ret; \ 27096 
poly16_t __s0 = __p0; \ 27097 poly16x8_t __s1 = __p1; \ 27098 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 27099 __ret = (poly16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (poly16x8_t)__rev1, __p2); \ 27100 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 27101 __ret; \ 27102 }) 27103 #define __noswap_vsetq_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 27104 poly16x8_t __ret; \ 27105 poly16_t __s0 = __p0; \ 27106 poly16x8_t __s1 = __p1; \ 27107 __ret = (poly16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (poly16x8_t)__s1, __p2); \ 27108 __ret; \ 27109 }) 27110 #endif 27111 27112 #ifdef __LITTLE_ENDIAN__ 27113 #define vsetq_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 27114 uint8x16_t __ret; \ 27115 uint8_t __s0 = __p0; \ 27116 uint8x16_t __s1 = __p1; \ 27117 __ret = (uint8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2); \ 27118 __ret; \ 27119 }) 27120 #else 27121 #define vsetq_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 27122 uint8x16_t __ret; \ 27123 uint8_t __s0 = __p0; \ 27124 uint8x16_t __s1 = __p1; \ 27125 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 27126 __ret = (uint8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__rev1, __p2); \ 27127 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 27128 __ret; \ 27129 }) 27130 #define __noswap_vsetq_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 27131 uint8x16_t __ret; \ 27132 uint8_t __s0 = __p0; \ 27133 uint8x16_t __s1 = __p1; \ 27134 __ret = (uint8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2); \ 27135 __ret; \ 27136 }) 27137 #endif 27138 27139 #ifdef __LITTLE_ENDIAN__ 27140 #define vsetq_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 27141 uint32x4_t __ret; \ 27142 uint32_t __s0 = __p0; \ 27143 uint32x4_t __s1 = __p1; \ 27144 __ret = (uint32x4_t) __builtin_neon_vsetq_lane_i32(__s0, 
(int32x4_t)__s1, __p2); \ 27145 __ret; \ 27146 }) 27147 #else 27148 #define vsetq_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 27149 uint32x4_t __ret; \ 27150 uint32_t __s0 = __p0; \ 27151 uint32x4_t __s1 = __p1; \ 27152 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 27153 __ret = (uint32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__rev1, __p2); \ 27154 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 27155 __ret; \ 27156 }) 27157 #define __noswap_vsetq_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 27158 uint32x4_t __ret; \ 27159 uint32_t __s0 = __p0; \ 27160 uint32x4_t __s1 = __p1; \ 27161 __ret = (uint32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__s1, __p2); \ 27162 __ret; \ 27163 }) 27164 #endif 27165 27166 #ifdef __LITTLE_ENDIAN__ 27167 #define vsetq_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 27168 uint64x2_t __ret; \ 27169 uint64_t __s0 = __p0; \ 27170 uint64x2_t __s1 = __p1; \ 27171 __ret = (uint64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2); \ 27172 __ret; \ 27173 }) 27174 #else 27175 #define vsetq_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 27176 uint64x2_t __ret; \ 27177 uint64_t __s0 = __p0; \ 27178 uint64x2_t __s1 = __p1; \ 27179 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 27180 __ret = (uint64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__rev1, __p2); \ 27181 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 27182 __ret; \ 27183 }) 27184 #define __noswap_vsetq_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 27185 uint64x2_t __ret; \ 27186 uint64_t __s0 = __p0; \ 27187 uint64x2_t __s1 = __p1; \ 27188 __ret = (uint64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2); \ 27189 __ret; \ 27190 }) 27191 #endif 27192 27193 #ifdef __LITTLE_ENDIAN__ 27194 #define vsetq_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 27195 uint16x8_t __ret; \ 27196 uint16_t __s0 = __p0; \ 27197 uint16x8_t __s1 = __p1; \ 27198 __ret = 
(uint16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, __p2); \ 27199 __ret; \ 27200 }) 27201 #else 27202 #define vsetq_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 27203 uint16x8_t __ret; \ 27204 uint16_t __s0 = __p0; \ 27205 uint16x8_t __s1 = __p1; \ 27206 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 27207 __ret = (uint16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__rev1, __p2); \ 27208 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 27209 __ret; \ 27210 }) 27211 #define __noswap_vsetq_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 27212 uint16x8_t __ret; \ 27213 uint16_t __s0 = __p0; \ 27214 uint16x8_t __s1 = __p1; \ 27215 __ret = (uint16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, __p2); \ 27216 __ret; \ 27217 }) 27218 #endif 27219 27220 #ifdef __LITTLE_ENDIAN__ 27221 #define vsetq_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 27222 int8x16_t __ret; \ 27223 int8_t __s0 = __p0; \ 27224 int8x16_t __s1 = __p1; \ 27225 __ret = (int8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2); \ 27226 __ret; \ 27227 }) 27228 #else 27229 #define vsetq_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 27230 int8x16_t __ret; \ 27231 int8_t __s0 = __p0; \ 27232 int8x16_t __s1 = __p1; \ 27233 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 27234 __ret = (int8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__rev1, __p2); \ 27235 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 27236 __ret; \ 27237 }) 27238 #define __noswap_vsetq_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 27239 int8x16_t __ret; \ 27240 int8_t __s0 = __p0; \ 27241 int8x16_t __s1 = __p1; \ 27242 __ret = (int8x16_t) __builtin_neon_vsetq_lane_i8(__s0, (int8x16_t)__s1, __p2); \ 27243 __ret; \ 27244 }) 27245 #endif 27246 27247 #ifdef __LITTLE_ENDIAN__ 27248 #define 
vsetq_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 27249 float32x4_t __ret; \ 27250 float32_t __s0 = __p0; \ 27251 float32x4_t __s1 = __p1; \ 27252 __ret = (float32x4_t) __builtin_neon_vsetq_lane_f32(__s0, (float32x4_t)__s1, __p2); \ 27253 __ret; \ 27254 }) 27255 #else 27256 #define vsetq_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 27257 float32x4_t __ret; \ 27258 float32_t __s0 = __p0; \ 27259 float32x4_t __s1 = __p1; \ 27260 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 27261 __ret = (float32x4_t) __builtin_neon_vsetq_lane_f32(__s0, (float32x4_t)__rev1, __p2); \ 27262 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 27263 __ret; \ 27264 }) 27265 #define __noswap_vsetq_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 27266 float32x4_t __ret; \ 27267 float32_t __s0 = __p0; \ 27268 float32x4_t __s1 = __p1; \ 27269 __ret = (float32x4_t) __builtin_neon_vsetq_lane_f32(__s0, (float32x4_t)__s1, __p2); \ 27270 __ret; \ 27271 }) 27272 #endif 27273 27274 #ifdef __LITTLE_ENDIAN__ 27275 #define vsetq_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 27276 int32x4_t __ret; \ 27277 int32_t __s0 = __p0; \ 27278 int32x4_t __s1 = __p1; \ 27279 __ret = (int32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__s1, __p2); \ 27280 __ret; \ 27281 }) 27282 #else 27283 #define vsetq_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 27284 int32x4_t __ret; \ 27285 int32_t __s0 = __p0; \ 27286 int32x4_t __s1 = __p1; \ 27287 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 27288 __ret = (int32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__rev1, __p2); \ 27289 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 27290 __ret; \ 27291 }) 27292 #define __noswap_vsetq_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 27293 int32x4_t __ret; \ 27294 int32_t __s0 = __p0; \ 27295 int32x4_t __s1 = __p1; \ 27296 __ret = (int32x4_t) __builtin_neon_vsetq_lane_i32(__s0, (int32x4_t)__s1, __p2); \ 27297 __ret; \ 27298 }) 27299 
#endif 27300 27301 #ifdef __LITTLE_ENDIAN__ 27302 #define vsetq_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 27303 int64x2_t __ret; \ 27304 int64_t __s0 = __p0; \ 27305 int64x2_t __s1 = __p1; \ 27306 __ret = (int64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2); \ 27307 __ret; \ 27308 }) 27309 #else 27310 #define vsetq_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 27311 int64x2_t __ret; \ 27312 int64_t __s0 = __p0; \ 27313 int64x2_t __s1 = __p1; \ 27314 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 27315 __ret = (int64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__rev1, __p2); \ 27316 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 27317 __ret; \ 27318 }) 27319 #define __noswap_vsetq_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 27320 int64x2_t __ret; \ 27321 int64_t __s0 = __p0; \ 27322 int64x2_t __s1 = __p1; \ 27323 __ret = (int64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (int64x2_t)__s1, __p2); \ 27324 __ret; \ 27325 }) 27326 #endif 27327 27328 #ifdef __LITTLE_ENDIAN__ 27329 #define vsetq_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 27330 int16x8_t __ret; \ 27331 int16_t __s0 = __p0; \ 27332 int16x8_t __s1 = __p1; \ 27333 __ret = (int16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, __p2); \ 27334 __ret; \ 27335 }) 27336 #else 27337 #define vsetq_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 27338 int16x8_t __ret; \ 27339 int16_t __s0 = __p0; \ 27340 int16x8_t __s1 = __p1; \ 27341 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 27342 __ret = (int16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__rev1, __p2); \ 27343 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 27344 __ret; \ 27345 }) 27346 #define __noswap_vsetq_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 27347 int16x8_t __ret; \ 27348 int16_t __s0 = __p0; \ 27349 int16x8_t __s1 = __p1; \ 27350 __ret = (int16x8_t) __builtin_neon_vsetq_lane_i16(__s0, (int16x8_t)__s1, 
__p2); \ 27351 __ret; \ 27352 }) 27353 #endif 27354 27355 #ifdef __LITTLE_ENDIAN__ 27356 #define vset_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 27357 uint8x8_t __ret; \ 27358 uint8_t __s0 = __p0; \ 27359 uint8x8_t __s1 = __p1; \ 27360 __ret = (uint8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__s1, __p2); \ 27361 __ret; \ 27362 }) 27363 #else 27364 #define vset_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 27365 uint8x8_t __ret; \ 27366 uint8_t __s0 = __p0; \ 27367 uint8x8_t __s1 = __p1; \ 27368 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 27369 __ret = (uint8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__rev1, __p2); \ 27370 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 27371 __ret; \ 27372 }) 27373 #define __noswap_vset_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 27374 uint8x8_t __ret; \ 27375 uint8_t __s0 = __p0; \ 27376 uint8x8_t __s1 = __p1; \ 27377 __ret = (uint8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__s1, __p2); \ 27378 __ret; \ 27379 }) 27380 #endif 27381 27382 #ifdef __LITTLE_ENDIAN__ 27383 #define vset_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 27384 uint32x2_t __ret; \ 27385 uint32_t __s0 = __p0; \ 27386 uint32x2_t __s1 = __p1; \ 27387 __ret = (uint32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__s1, __p2); \ 27388 __ret; \ 27389 }) 27390 #else 27391 #define vset_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 27392 uint32x2_t __ret; \ 27393 uint32_t __s0 = __p0; \ 27394 uint32x2_t __s1 = __p1; \ 27395 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 27396 __ret = (uint32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__rev1, __p2); \ 27397 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 27398 __ret; \ 27399 }) 27400 #define __noswap_vset_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 27401 uint32x2_t __ret; \ 27402 uint32_t __s0 = __p0; \ 27403 uint32x2_t __s1 = __p1; \ 27404 __ret = (uint32x2_t) 
__builtin_neon_vset_lane_i32(__s0, (int32x2_t)__s1, __p2); \ 27405 __ret; \ 27406 }) 27407 #endif 27408 27409 #define vset_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 27410 uint64x1_t __ret; \ 27411 uint64_t __s0 = __p0; \ 27412 uint64x1_t __s1 = __p1; \ 27413 __ret = (uint64x1_t) __builtin_neon_vset_lane_i64(__s0, (int64x1_t)__s1, __p2); \ 27414 __ret; \ 27415 }) 27416 #ifdef __LITTLE_ENDIAN__ 27417 #define vset_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 27418 uint16x4_t __ret; \ 27419 uint16_t __s0 = __p0; \ 27420 uint16x4_t __s1 = __p1; \ 27421 __ret = (uint16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__s1, __p2); \ 27422 __ret; \ 27423 }) 27424 #else 27425 #define vset_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 27426 uint16x4_t __ret; \ 27427 uint16_t __s0 = __p0; \ 27428 uint16x4_t __s1 = __p1; \ 27429 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 27430 __ret = (uint16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__rev1, __p2); \ 27431 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 27432 __ret; \ 27433 }) 27434 #define __noswap_vset_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 27435 uint16x4_t __ret; \ 27436 uint16_t __s0 = __p0; \ 27437 uint16x4_t __s1 = __p1; \ 27438 __ret = (uint16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__s1, __p2); \ 27439 __ret; \ 27440 }) 27441 #endif 27442 27443 #ifdef __LITTLE_ENDIAN__ 27444 #define vset_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 27445 int8x8_t __ret; \ 27446 int8_t __s0 = __p0; \ 27447 int8x8_t __s1 = __p1; \ 27448 __ret = (int8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__s1, __p2); \ 27449 __ret; \ 27450 }) 27451 #else 27452 #define vset_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 27453 int8x8_t __ret; \ 27454 int8_t __s0 = __p0; \ 27455 int8x8_t __s1 = __p1; \ 27456 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 27457 __ret = (int8x8_t) __builtin_neon_vset_lane_i8(__s0, 
(int8x8_t)__rev1, __p2); \ 27458 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 27459 __ret; \ 27460 }) 27461 #define __noswap_vset_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 27462 int8x8_t __ret; \ 27463 int8_t __s0 = __p0; \ 27464 int8x8_t __s1 = __p1; \ 27465 __ret = (int8x8_t) __builtin_neon_vset_lane_i8(__s0, (int8x8_t)__s1, __p2); \ 27466 __ret; \ 27467 }) 27468 #endif 27469 27470 #ifdef __LITTLE_ENDIAN__ 27471 #define vset_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 27472 float32x2_t __ret; \ 27473 float32_t __s0 = __p0; \ 27474 float32x2_t __s1 = __p1; \ 27475 __ret = (float32x2_t) __builtin_neon_vset_lane_f32(__s0, (float32x2_t)__s1, __p2); \ 27476 __ret; \ 27477 }) 27478 #else 27479 #define vset_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 27480 float32x2_t __ret; \ 27481 float32_t __s0 = __p0; \ 27482 float32x2_t __s1 = __p1; \ 27483 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 27484 __ret = (float32x2_t) __builtin_neon_vset_lane_f32(__s0, (float32x2_t)__rev1, __p2); \ 27485 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 27486 __ret; \ 27487 }) 27488 #define __noswap_vset_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 27489 float32x2_t __ret; \ 27490 float32_t __s0 = __p0; \ 27491 float32x2_t __s1 = __p1; \ 27492 __ret = (float32x2_t) __builtin_neon_vset_lane_f32(__s0, (float32x2_t)__s1, __p2); \ 27493 __ret; \ 27494 }) 27495 #endif 27496 27497 #ifdef __LITTLE_ENDIAN__ 27498 #define vset_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 27499 int32x2_t __ret; \ 27500 int32_t __s0 = __p0; \ 27501 int32x2_t __s1 = __p1; \ 27502 __ret = (int32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__s1, __p2); \ 27503 __ret; \ 27504 }) 27505 #else 27506 #define vset_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 27507 int32x2_t __ret; \ 27508 int32_t __s0 = __p0; \ 27509 int32x2_t __s1 = __p1; \ 27510 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 27511 __ret = (int32x2_t) 
__builtin_neon_vset_lane_i32(__s0, (int32x2_t)__rev1, __p2); \ 27512 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 27513 __ret; \ 27514 }) 27515 #define __noswap_vset_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 27516 int32x2_t __ret; \ 27517 int32_t __s0 = __p0; \ 27518 int32x2_t __s1 = __p1; \ 27519 __ret = (int32x2_t) __builtin_neon_vset_lane_i32(__s0, (int32x2_t)__s1, __p2); \ 27520 __ret; \ 27521 }) 27522 #endif 27523 27524 #define vset_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 27525 int64x1_t __ret; \ 27526 int64_t __s0 = __p0; \ 27527 int64x1_t __s1 = __p1; \ 27528 __ret = (int64x1_t) __builtin_neon_vset_lane_i64(__s0, (int64x1_t)__s1, __p2); \ 27529 __ret; \ 27530 }) 27531 #ifdef __LITTLE_ENDIAN__ 27532 #define vset_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 27533 int16x4_t __ret; \ 27534 int16_t __s0 = __p0; \ 27535 int16x4_t __s1 = __p1; \ 27536 __ret = (int16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__s1, __p2); \ 27537 __ret; \ 27538 }) 27539 #else 27540 #define vset_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 27541 int16x4_t __ret; \ 27542 int16_t __s0 = __p0; \ 27543 int16x4_t __s1 = __p1; \ 27544 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 27545 __ret = (int16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__rev1, __p2); \ 27546 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 27547 __ret; \ 27548 }) 27549 #define __noswap_vset_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 27550 int16x4_t __ret; \ 27551 int16_t __s0 = __p0; \ 27552 int16x4_t __s1 = __p1; \ 27553 __ret = (int16x4_t) __builtin_neon_vset_lane_i16(__s0, (int16x4_t)__s1, __p2); \ 27554 __ret; \ 27555 }) 27556 #endif 27557 27558 #ifdef __LITTLE_ENDIAN__ 27559 __ai __attribute__((target("neon"))) uint8x16_t vshlq_u8(uint8x16_t __p0, int8x16_t __p1) { 27560 uint8x16_t __ret; 27561 __ret = (uint8x16_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 27562 return __ret; 27563 } 27564 #else 27565 __ai 
__attribute__((target("neon"))) uint8x16_t vshlq_u8(uint8x16_t __p0, int8x16_t __p1) { 27566 uint8x16_t __ret; 27567 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 27568 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 27569 __ret = (uint8x16_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 27570 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 27571 return __ret; 27572 } 27573 #endif 27574 27575 #ifdef __LITTLE_ENDIAN__ 27576 __ai __attribute__((target("neon"))) uint32x4_t vshlq_u32(uint32x4_t __p0, int32x4_t __p1) { 27577 uint32x4_t __ret; 27578 __ret = (uint32x4_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 27579 return __ret; 27580 } 27581 #else 27582 __ai __attribute__((target("neon"))) uint32x4_t vshlq_u32(uint32x4_t __p0, int32x4_t __p1) { 27583 uint32x4_t __ret; 27584 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 27585 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 27586 __ret = (uint32x4_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 27587 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 27588 return __ret; 27589 } 27590 #endif 27591 27592 #ifdef __LITTLE_ENDIAN__ 27593 __ai __attribute__((target("neon"))) uint64x2_t vshlq_u64(uint64x2_t __p0, int64x2_t __p1) { 27594 uint64x2_t __ret; 27595 __ret = (uint64x2_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 27596 return __ret; 27597 } 27598 #else 27599 __ai __attribute__((target("neon"))) uint64x2_t vshlq_u64(uint64x2_t __p0, int64x2_t __p1) { 27600 uint64x2_t __ret; 27601 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 27602 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 27603 __ret = (uint64x2_t) 
__builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 27604 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 27605 return __ret; 27606 } 27607 #endif 27608 27609 #ifdef __LITTLE_ENDIAN__ 27610 __ai __attribute__((target("neon"))) uint16x8_t vshlq_u16(uint16x8_t __p0, int16x8_t __p1) { 27611 uint16x8_t __ret; 27612 __ret = (uint16x8_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 27613 return __ret; 27614 } 27615 #else 27616 __ai __attribute__((target("neon"))) uint16x8_t vshlq_u16(uint16x8_t __p0, int16x8_t __p1) { 27617 uint16x8_t __ret; 27618 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 27619 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 27620 __ret = (uint16x8_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 27621 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 27622 return __ret; 27623 } 27624 #endif 27625 27626 #ifdef __LITTLE_ENDIAN__ 27627 __ai __attribute__((target("neon"))) int8x16_t vshlq_s8(int8x16_t __p0, int8x16_t __p1) { 27628 int8x16_t __ret; 27629 __ret = (int8x16_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 27630 return __ret; 27631 } 27632 #else 27633 __ai __attribute__((target("neon"))) int8x16_t vshlq_s8(int8x16_t __p0, int8x16_t __p1) { 27634 int8x16_t __ret; 27635 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 27636 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 27637 __ret = (int8x16_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 27638 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 27639 return __ret; 27640 } 27641 #endif 27642 27643 #ifdef __LITTLE_ENDIAN__ 27644 __ai __attribute__((target("neon"))) int32x4_t vshlq_s32(int32x4_t __p0, int32x4_t 
__p1) { 27645 int32x4_t __ret; 27646 __ret = (int32x4_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 27647 return __ret; 27648 } 27649 #else 27650 __ai __attribute__((target("neon"))) int32x4_t vshlq_s32(int32x4_t __p0, int32x4_t __p1) { 27651 int32x4_t __ret; 27652 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 27653 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 27654 __ret = (int32x4_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 27655 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 27656 return __ret; 27657 } 27658 #endif 27659 27660 #ifdef __LITTLE_ENDIAN__ 27661 __ai __attribute__((target("neon"))) int64x2_t vshlq_s64(int64x2_t __p0, int64x2_t __p1) { 27662 int64x2_t __ret; 27663 __ret = (int64x2_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 27664 return __ret; 27665 } 27666 #else 27667 __ai __attribute__((target("neon"))) int64x2_t vshlq_s64(int64x2_t __p0, int64x2_t __p1) { 27668 int64x2_t __ret; 27669 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 27670 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 27671 __ret = (int64x2_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 27672 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 27673 return __ret; 27674 } 27675 #endif 27676 27677 #ifdef __LITTLE_ENDIAN__ 27678 __ai __attribute__((target("neon"))) int16x8_t vshlq_s16(int16x8_t __p0, int16x8_t __p1) { 27679 int16x8_t __ret; 27680 __ret = (int16x8_t) __builtin_neon_vshlq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 27681 return __ret; 27682 } 27683 #else 27684 __ai __attribute__((target("neon"))) int16x8_t vshlq_s16(int16x8_t __p0, int16x8_t __p1) { 27685 int16x8_t __ret; 27686 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 27687 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 27688 __ret = 
(int16x8_t) __builtin_neon_vshlq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 27689 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 27690 return __ret; 27691 } 27692 #endif 27693 27694 #ifdef __LITTLE_ENDIAN__ 27695 __ai __attribute__((target("neon"))) uint8x8_t vshl_u8(uint8x8_t __p0, int8x8_t __p1) { 27696 uint8x8_t __ret; 27697 __ret = (uint8x8_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 27698 return __ret; 27699 } 27700 #else 27701 __ai __attribute__((target("neon"))) uint8x8_t vshl_u8(uint8x8_t __p0, int8x8_t __p1) { 27702 uint8x8_t __ret; 27703 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 27704 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 27705 __ret = (uint8x8_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 27706 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 27707 return __ret; 27708 } 27709 #endif 27710 27711 #ifdef __LITTLE_ENDIAN__ 27712 __ai __attribute__((target("neon"))) uint32x2_t vshl_u32(uint32x2_t __p0, int32x2_t __p1) { 27713 uint32x2_t __ret; 27714 __ret = (uint32x2_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 27715 return __ret; 27716 } 27717 #else 27718 __ai __attribute__((target("neon"))) uint32x2_t vshl_u32(uint32x2_t __p0, int32x2_t __p1) { 27719 uint32x2_t __ret; 27720 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 27721 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 27722 __ret = (uint32x2_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 27723 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 27724 return __ret; 27725 } 27726 #endif 27727 27728 __ai __attribute__((target("neon"))) uint64x1_t vshl_u64(uint64x1_t __p0, int64x1_t __p1) { 27729 uint64x1_t __ret; 27730 __ret = (uint64x1_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 27731 return __ret; 27732 } 27733 #ifdef 
__LITTLE_ENDIAN__ 27734 __ai __attribute__((target("neon"))) uint16x4_t vshl_u16(uint16x4_t __p0, int16x4_t __p1) { 27735 uint16x4_t __ret; 27736 __ret = (uint16x4_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 27737 return __ret; 27738 } 27739 #else 27740 __ai __attribute__((target("neon"))) uint16x4_t vshl_u16(uint16x4_t __p0, int16x4_t __p1) { 27741 uint16x4_t __ret; 27742 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 27743 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 27744 __ret = (uint16x4_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 27745 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 27746 return __ret; 27747 } 27748 #endif 27749 27750 #ifdef __LITTLE_ENDIAN__ 27751 __ai __attribute__((target("neon"))) int8x8_t vshl_s8(int8x8_t __p0, int8x8_t __p1) { 27752 int8x8_t __ret; 27753 __ret = (int8x8_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 27754 return __ret; 27755 } 27756 #else 27757 __ai __attribute__((target("neon"))) int8x8_t vshl_s8(int8x8_t __p0, int8x8_t __p1) { 27758 int8x8_t __ret; 27759 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 27760 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 27761 __ret = (int8x8_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 27762 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 27763 return __ret; 27764 } 27765 #endif 27766 27767 #ifdef __LITTLE_ENDIAN__ 27768 __ai __attribute__((target("neon"))) int32x2_t vshl_s32(int32x2_t __p0, int32x2_t __p1) { 27769 int32x2_t __ret; 27770 __ret = (int32x2_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 27771 return __ret; 27772 } 27773 #else 27774 __ai __attribute__((target("neon"))) int32x2_t vshl_s32(int32x2_t __p0, int32x2_t __p1) { 27775 int32x2_t __ret; 27776 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 
0); 27777 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 27778 __ret = (int32x2_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 27779 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 27780 return __ret; 27781 } 27782 #endif 27783 27784 __ai __attribute__((target("neon"))) int64x1_t vshl_s64(int64x1_t __p0, int64x1_t __p1) { 27785 int64x1_t __ret; 27786 __ret = (int64x1_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 3); 27787 return __ret; 27788 } 27789 #ifdef __LITTLE_ENDIAN__ 27790 __ai __attribute__((target("neon"))) int16x4_t vshl_s16(int16x4_t __p0, int16x4_t __p1) { 27791 int16x4_t __ret; 27792 __ret = (int16x4_t) __builtin_neon_vshl_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 27793 return __ret; 27794 } 27795 #else 27796 __ai __attribute__((target("neon"))) int16x4_t vshl_s16(int16x4_t __p0, int16x4_t __p1) { 27797 int16x4_t __ret; 27798 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 27799 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 27800 __ret = (int16x4_t) __builtin_neon_vshl_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 27801 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 27802 return __ret; 27803 } 27804 #endif 27805 27806 #ifdef __LITTLE_ENDIAN__ 27807 #define vshlq_n_u8(__p0, __p1) __extension__ ({ \ 27808 uint8x16_t __ret; \ 27809 uint8x16_t __s0 = __p0; \ 27810 __ret = (uint8x16_t) __builtin_neon_vshlq_n_v((int8x16_t)__s0, __p1, 48); \ 27811 __ret; \ 27812 }) 27813 #else 27814 #define vshlq_n_u8(__p0, __p1) __extension__ ({ \ 27815 uint8x16_t __ret; \ 27816 uint8x16_t __s0 = __p0; \ 27817 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 27818 __ret = (uint8x16_t) __builtin_neon_vshlq_n_v((int8x16_t)__rev0, __p1, 48); \ 27819 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 27820 __ret; \ 27821 }) 27822 #endif 
/*
 * vshlq_n_u32 / vshlq_n_u64 / vshlq_n_u16
 *
 * Each macro copies its vector operand __p0 into a typed local, so the
 * operand expression appears exactly once in the expansion.  The copy is
 * reinterpreted as int8x16_t and handed to __builtin_neon_vshlq_n_v
 * together with __p1 (pasted through unchanged) and a per-type selector
 * constant.  The builtin's result is cast back to the operand's vector
 * type, which is also the type of the whole expression.
 *
 * When __LITTLE_ENDIAN__ is not defined, the operand's lanes are put in
 * reverse order before the builtin call and the result's lanes are
 * reversed again afterwards.
 *
 * NOTE(review): __p1 is presumably required to be an integer constant
 * expression, and the trailing constant (50 / 51 / 49) presumably selects
 * the element type for the generic builtin -- confirm against the Clang
 * NEON builtin definitions.
 */

/* uint32x4_t operand and result; selector 50. */
#ifdef __LITTLE_ENDIAN__
#define vshlq_n_u32(__p0, __p1) __extension__ ({ \
  uint32x4_t __vec = __p0; \
  (uint32x4_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec, __p1, 50); \
})
#else
#define vshlq_n_u32(__p0, __p1) __extension__ ({ \
  uint32x4_t __vec = __p0; \
  uint32x4_t __vec_rev = __builtin_shufflevector(__vec, __vec, 3, 2, 1, 0); \
  uint32x4_t __res = (uint32x4_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec_rev, __p1, 50); \
  __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
  __res; \
})
#endif

/* uint64x2_t operand and result; selector 51. */
#ifdef __LITTLE_ENDIAN__
#define vshlq_n_u64(__p0, __p1) __extension__ ({ \
  uint64x2_t __vec = __p0; \
  (uint64x2_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec, __p1, 51); \
})
#else
#define vshlq_n_u64(__p0, __p1) __extension__ ({ \
  uint64x2_t __vec = __p0; \
  uint64x2_t __vec_rev = __builtin_shufflevector(__vec, __vec, 1, 0); \
  uint64x2_t __res = (uint64x2_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec_rev, __p1, 51); \
  __res = __builtin_shufflevector(__res, __res, 1, 0); \
  __res; \
})
#endif

/* uint16x8_t operand and result; selector 49. */
#ifdef __LITTLE_ENDIAN__
#define vshlq_n_u16(__p0, __p1) __extension__ ({ \
  uint16x8_t __vec = __p0; \
  (uint16x8_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec, __p1, 49); \
})
#else
#define vshlq_n_u16(__p0, __p1) __extension__ ({ \
  uint16x8_t __vec = __p0; \
  uint16x8_t __vec_rev = __builtin_shufflevector(__vec, __vec, 7, 6, 5, 4, 3, 2, 1, 0); \
  uint16x8_t __res = (uint16x8_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec_rev, __p1, 49); \
  __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
  __res; \
})
#endif

/*
 * vshlq_n_s8 / vshlq_n_s32 / vshlq_n_s64 / vshlq_n_s16 (128-bit vector types)
 * vshl_n_u8 / vshl_n_u32                               (64-bit vector types)
 *
 * Each macro copies its vector operand __p0 into a typed local, so the
 * operand expression appears exactly once in the expansion.  The copy is
 * reinterpreted as int8x16_t (vshlq_n_*) or int8x8_t (vshl_n_*) and handed
 * to __builtin_neon_vshlq_n_v / __builtin_neon_vshl_n_v together with __p1
 * (pasted through unchanged) and a per-type selector constant.  The
 * builtin's result is cast back to the operand's vector type, which is also
 * the type of the whole expression.
 *
 * When __LITTLE_ENDIAN__ is not defined, the operand's lanes are put in
 * reverse order before the builtin call and the result's lanes are
 * reversed again afterwards.
 *
 * NOTE(review): __p1 is presumably required to be an integer constant
 * expression, and the trailing constant presumably selects the element
 * type for the generic builtin -- confirm against the Clang NEON builtin
 * definitions.
 */

/* int8x16_t operand and result; selector 32. */
#ifdef __LITTLE_ENDIAN__
#define vshlq_n_s8(__p0, __p1) __extension__ ({ \
  int8x16_t __vec = __p0; \
  (int8x16_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec, __p1, 32); \
})
#else
#define vshlq_n_s8(__p0, __p1) __extension__ ({ \
  int8x16_t __vec = __p0; \
  int8x16_t __vec_rev = __builtin_shufflevector(__vec, __vec, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  int8x16_t __res = (int8x16_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec_rev, __p1, 32); \
  __res = __builtin_shufflevector(__res, __res, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __res; \
})
#endif

/* int32x4_t operand and result; selector 34. */
#ifdef __LITTLE_ENDIAN__
#define vshlq_n_s32(__p0, __p1) __extension__ ({ \
  int32x4_t __vec = __p0; \
  (int32x4_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec, __p1, 34); \
})
#else
#define vshlq_n_s32(__p0, __p1) __extension__ ({ \
  int32x4_t __vec = __p0; \
  int32x4_t __vec_rev = __builtin_shufflevector(__vec, __vec, 3, 2, 1, 0); \
  int32x4_t __res = (int32x4_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec_rev, __p1, 34); \
  __res = __builtin_shufflevector(__res, __res, 3, 2, 1, 0); \
  __res; \
})
#endif

/* int64x2_t operand and result; selector 35. */
#ifdef __LITTLE_ENDIAN__
#define vshlq_n_s64(__p0, __p1) __extension__ ({ \
  int64x2_t __vec = __p0; \
  (int64x2_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec, __p1, 35); \
})
#else
#define vshlq_n_s64(__p0, __p1) __extension__ ({ \
  int64x2_t __vec = __p0; \
  int64x2_t __vec_rev = __builtin_shufflevector(__vec, __vec, 1, 0); \
  int64x2_t __res = (int64x2_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec_rev, __p1, 35); \
  __res = __builtin_shufflevector(__res, __res, 1, 0); \
  __res; \
})
#endif

/* int16x8_t operand and result; selector 33. */
#ifdef __LITTLE_ENDIAN__
#define vshlq_n_s16(__p0, __p1) __extension__ ({ \
  int16x8_t __vec = __p0; \
  (int16x8_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec, __p1, 33); \
})
#else
#define vshlq_n_s16(__p0, __p1) __extension__ ({ \
  int16x8_t __vec = __p0; \
  int16x8_t __vec_rev = __builtin_shufflevector(__vec, __vec, 7, 6, 5, 4, 3, 2, 1, 0); \
  int16x8_t __res = (int16x8_t) __builtin_neon_vshlq_n_v((int8x16_t)__vec_rev, __p1, 33); \
  __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
  __res; \
})
#endif

/* uint8x8_t operand and result; selector 16. */
#ifdef __LITTLE_ENDIAN__
#define vshl_n_u8(__p0, __p1) __extension__ ({ \
  uint8x8_t __vec = __p0; \
  (uint8x8_t) __builtin_neon_vshl_n_v((int8x8_t)__vec, __p1, 16); \
})
#else
#define vshl_n_u8(__p0, __p1) __extension__ ({ \
  uint8x8_t __vec = __p0; \
  uint8x8_t __vec_rev = __builtin_shufflevector(__vec, __vec, 7, 6, 5, 4, 3, 2, 1, 0); \
  uint8x8_t __res = (uint8x8_t) __builtin_neon_vshl_n_v((int8x8_t)__vec_rev, __p1, 16); \
  __res = __builtin_shufflevector(__res, __res, 7, 6, 5, 4, 3, 2, 1, 0); \
  __res; \
})
#endif

/* uint32x2_t operand and result; selector 18. */
#ifdef __LITTLE_ENDIAN__
#define vshl_n_u32(__p0, __p1) __extension__ ({ \
  uint32x2_t __vec = __p0; \
  (uint32x2_t) __builtin_neon_vshl_n_v((int8x8_t)__vec, __p1, 18); \
})
#else
#define vshl_n_u32(__p0, __p1) __extension__ ({ \
  uint32x2_t __vec = __p0; \
  uint32x2_t __vec_rev = __builtin_shufflevector(__vec, __vec, 1, 0); \
  uint32x2_t __res = (uint32x2_t) __builtin_neon_vshl_n_v((int8x8_t)__vec_rev, __p1, 18); \
  __res = __builtin_shufflevector(__res, __res, 1, 0); \
  __res; \
})
#endif
27985 27986 #define vshl_n_u64(__p0, __p1) __extension__ ({ \ 27987 uint64x1_t __ret; \ 27988 uint64x1_t __s0 = __p0; \ 27989 __ret = (uint64x1_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 19); \ 27990 __ret; \ 27991 }) 27992 #ifdef __LITTLE_ENDIAN__ 27993 #define vshl_n_u16(__p0, __p1) __extension__ ({ \ 27994 uint16x4_t __ret; \ 27995 uint16x4_t __s0 = __p0; \ 27996 __ret = (uint16x4_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 17); \ 27997 __ret; \ 27998 }) 27999 #else 28000 #define vshl_n_u16(__p0, __p1) __extension__ ({ \ 28001 uint16x4_t __ret; \ 28002 uint16x4_t __s0 = __p0; \ 28003 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28004 __ret = (uint16x4_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 17); \ 28005 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28006 __ret; \ 28007 }) 28008 #endif 28009 28010 #ifdef __LITTLE_ENDIAN__ 28011 #define vshl_n_s8(__p0, __p1) __extension__ ({ \ 28012 int8x8_t __ret; \ 28013 int8x8_t __s0 = __p0; \ 28014 __ret = (int8x8_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 0); \ 28015 __ret; \ 28016 }) 28017 #else 28018 #define vshl_n_s8(__p0, __p1) __extension__ ({ \ 28019 int8x8_t __ret; \ 28020 int8x8_t __s0 = __p0; \ 28021 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28022 __ret = (int8x8_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 0); \ 28023 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28024 __ret; \ 28025 }) 28026 #endif 28027 28028 #ifdef __LITTLE_ENDIAN__ 28029 #define vshl_n_s32(__p0, __p1) __extension__ ({ \ 28030 int32x2_t __ret; \ 28031 int32x2_t __s0 = __p0; \ 28032 __ret = (int32x2_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 2); \ 28033 __ret; \ 28034 }) 28035 #else 28036 #define vshl_n_s32(__p0, __p1) __extension__ ({ \ 28037 int32x2_t __ret; \ 28038 int32x2_t __s0 = __p0; \ 28039 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28040 __ret = 
(int32x2_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 2); \ 28041 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28042 __ret; \ 28043 }) 28044 #endif 28045 28046 #define vshl_n_s64(__p0, __p1) __extension__ ({ \ 28047 int64x1_t __ret; \ 28048 int64x1_t __s0 = __p0; \ 28049 __ret = (int64x1_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 3); \ 28050 __ret; \ 28051 }) 28052 #ifdef __LITTLE_ENDIAN__ 28053 #define vshl_n_s16(__p0, __p1) __extension__ ({ \ 28054 int16x4_t __ret; \ 28055 int16x4_t __s0 = __p0; \ 28056 __ret = (int16x4_t) __builtin_neon_vshl_n_v((int8x8_t)__s0, __p1, 1); \ 28057 __ret; \ 28058 }) 28059 #else 28060 #define vshl_n_s16(__p0, __p1) __extension__ ({ \ 28061 int16x4_t __ret; \ 28062 int16x4_t __s0 = __p0; \ 28063 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28064 __ret = (int16x4_t) __builtin_neon_vshl_n_v((int8x8_t)__rev0, __p1, 1); \ 28065 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28066 __ret; \ 28067 }) 28068 #endif 28069 28070 #ifdef __LITTLE_ENDIAN__ 28071 #define vshll_n_u8(__p0, __p1) __extension__ ({ \ 28072 uint16x8_t __ret; \ 28073 uint8x8_t __s0 = __p0; \ 28074 __ret = (uint16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 49); \ 28075 __ret; \ 28076 }) 28077 #else 28078 #define vshll_n_u8(__p0, __p1) __extension__ ({ \ 28079 uint16x8_t __ret; \ 28080 uint8x8_t __s0 = __p0; \ 28081 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28082 __ret = (uint16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 49); \ 28083 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28084 __ret; \ 28085 }) 28086 #define __noswap_vshll_n_u8(__p0, __p1) __extension__ ({ \ 28087 uint16x8_t __ret; \ 28088 uint8x8_t __s0 = __p0; \ 28089 __ret = (uint16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 49); \ 28090 __ret; \ 28091 }) 28092 #endif 28093 28094 #ifdef __LITTLE_ENDIAN__ 28095 #define vshll_n_u32(__p0, __p1) 
__extension__ ({ \ 28096 uint64x2_t __ret; \ 28097 uint32x2_t __s0 = __p0; \ 28098 __ret = (uint64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 51); \ 28099 __ret; \ 28100 }) 28101 #else 28102 #define vshll_n_u32(__p0, __p1) __extension__ ({ \ 28103 uint64x2_t __ret; \ 28104 uint32x2_t __s0 = __p0; \ 28105 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28106 __ret = (uint64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 51); \ 28107 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28108 __ret; \ 28109 }) 28110 #define __noswap_vshll_n_u32(__p0, __p1) __extension__ ({ \ 28111 uint64x2_t __ret; \ 28112 uint32x2_t __s0 = __p0; \ 28113 __ret = (uint64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 51); \ 28114 __ret; \ 28115 }) 28116 #endif 28117 28118 #ifdef __LITTLE_ENDIAN__ 28119 #define vshll_n_u16(__p0, __p1) __extension__ ({ \ 28120 uint32x4_t __ret; \ 28121 uint16x4_t __s0 = __p0; \ 28122 __ret = (uint32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 50); \ 28123 __ret; \ 28124 }) 28125 #else 28126 #define vshll_n_u16(__p0, __p1) __extension__ ({ \ 28127 uint32x4_t __ret; \ 28128 uint16x4_t __s0 = __p0; \ 28129 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28130 __ret = (uint32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 50); \ 28131 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28132 __ret; \ 28133 }) 28134 #define __noswap_vshll_n_u16(__p0, __p1) __extension__ ({ \ 28135 uint32x4_t __ret; \ 28136 uint16x4_t __s0 = __p0; \ 28137 __ret = (uint32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 50); \ 28138 __ret; \ 28139 }) 28140 #endif 28141 28142 #ifdef __LITTLE_ENDIAN__ 28143 #define vshll_n_s8(__p0, __p1) __extension__ ({ \ 28144 int16x8_t __ret; \ 28145 int8x8_t __s0 = __p0; \ 28146 __ret = (int16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 33); \ 28147 __ret; \ 28148 }) 28149 #else 28150 #define vshll_n_s8(__p0, __p1) __extension__ 
({ \ 28151 int16x8_t __ret; \ 28152 int8x8_t __s0 = __p0; \ 28153 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28154 __ret = (int16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 33); \ 28155 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28156 __ret; \ 28157 }) 28158 #define __noswap_vshll_n_s8(__p0, __p1) __extension__ ({ \ 28159 int16x8_t __ret; \ 28160 int8x8_t __s0 = __p0; \ 28161 __ret = (int16x8_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 33); \ 28162 __ret; \ 28163 }) 28164 #endif 28165 28166 #ifdef __LITTLE_ENDIAN__ 28167 #define vshll_n_s32(__p0, __p1) __extension__ ({ \ 28168 int64x2_t __ret; \ 28169 int32x2_t __s0 = __p0; \ 28170 __ret = (int64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 35); \ 28171 __ret; \ 28172 }) 28173 #else 28174 #define vshll_n_s32(__p0, __p1) __extension__ ({ \ 28175 int64x2_t __ret; \ 28176 int32x2_t __s0 = __p0; \ 28177 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28178 __ret = (int64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 35); \ 28179 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28180 __ret; \ 28181 }) 28182 #define __noswap_vshll_n_s32(__p0, __p1) __extension__ ({ \ 28183 int64x2_t __ret; \ 28184 int32x2_t __s0 = __p0; \ 28185 __ret = (int64x2_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 35); \ 28186 __ret; \ 28187 }) 28188 #endif 28189 28190 #ifdef __LITTLE_ENDIAN__ 28191 #define vshll_n_s16(__p0, __p1) __extension__ ({ \ 28192 int32x4_t __ret; \ 28193 int16x4_t __s0 = __p0; \ 28194 __ret = (int32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 34); \ 28195 __ret; \ 28196 }) 28197 #else 28198 #define vshll_n_s16(__p0, __p1) __extension__ ({ \ 28199 int32x4_t __ret; \ 28200 int16x4_t __s0 = __p0; \ 28201 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28202 __ret = (int32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__rev0, __p1, 34); \ 28203 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28204 __ret; \ 28205 }) 28206 #define __noswap_vshll_n_s16(__p0, __p1) __extension__ ({ \ 28207 int32x4_t __ret; \ 28208 int16x4_t __s0 = __p0; \ 28209 __ret = (int32x4_t) __builtin_neon_vshll_n_v((int8x8_t)__s0, __p1, 34); \ 28210 __ret; \ 28211 }) 28212 #endif 28213 28214 #ifdef __LITTLE_ENDIAN__ 28215 #define vshrq_n_u8(__p0, __p1) __extension__ ({ \ 28216 uint8x16_t __ret; \ 28217 uint8x16_t __s0 = __p0; \ 28218 __ret = (uint8x16_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 48); \ 28219 __ret; \ 28220 }) 28221 #else 28222 #define vshrq_n_u8(__p0, __p1) __extension__ ({ \ 28223 uint8x16_t __ret; \ 28224 uint8x16_t __s0 = __p0; \ 28225 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28226 __ret = (uint8x16_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 48); \ 28227 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28228 __ret; \ 28229 }) 28230 #endif 28231 28232 #ifdef __LITTLE_ENDIAN__ 28233 #define vshrq_n_u32(__p0, __p1) __extension__ ({ \ 28234 uint32x4_t __ret; \ 28235 uint32x4_t __s0 = __p0; \ 28236 __ret = (uint32x4_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 50); \ 28237 __ret; \ 28238 }) 28239 #else 28240 #define vshrq_n_u32(__p0, __p1) __extension__ ({ \ 28241 uint32x4_t __ret; \ 28242 uint32x4_t __s0 = __p0; \ 28243 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28244 __ret = (uint32x4_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 50); \ 28245 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28246 __ret; \ 28247 }) 28248 #endif 28249 28250 #ifdef __LITTLE_ENDIAN__ 28251 #define vshrq_n_u64(__p0, __p1) __extension__ ({ \ 28252 uint64x2_t __ret; \ 28253 uint64x2_t __s0 = __p0; \ 28254 __ret = (uint64x2_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 51); \ 28255 __ret; \ 28256 }) 28257 #else 28258 #define 
vshrq_n_u64(__p0, __p1) __extension__ ({ \ 28259 uint64x2_t __ret; \ 28260 uint64x2_t __s0 = __p0; \ 28261 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28262 __ret = (uint64x2_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 51); \ 28263 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28264 __ret; \ 28265 }) 28266 #endif 28267 28268 #ifdef __LITTLE_ENDIAN__ 28269 #define vshrq_n_u16(__p0, __p1) __extension__ ({ \ 28270 uint16x8_t __ret; \ 28271 uint16x8_t __s0 = __p0; \ 28272 __ret = (uint16x8_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 49); \ 28273 __ret; \ 28274 }) 28275 #else 28276 #define vshrq_n_u16(__p0, __p1) __extension__ ({ \ 28277 uint16x8_t __ret; \ 28278 uint16x8_t __s0 = __p0; \ 28279 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28280 __ret = (uint16x8_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 49); \ 28281 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28282 __ret; \ 28283 }) 28284 #endif 28285 28286 #ifdef __LITTLE_ENDIAN__ 28287 #define vshrq_n_s8(__p0, __p1) __extension__ ({ \ 28288 int8x16_t __ret; \ 28289 int8x16_t __s0 = __p0; \ 28290 __ret = (int8x16_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 32); \ 28291 __ret; \ 28292 }) 28293 #else 28294 #define vshrq_n_s8(__p0, __p1) __extension__ ({ \ 28295 int8x16_t __ret; \ 28296 int8x16_t __s0 = __p0; \ 28297 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28298 __ret = (int8x16_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 32); \ 28299 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28300 __ret; \ 28301 }) 28302 #endif 28303 28304 #ifdef __LITTLE_ENDIAN__ 28305 #define vshrq_n_s32(__p0, __p1) __extension__ ({ \ 28306 int32x4_t __ret; \ 28307 int32x4_t __s0 = __p0; \ 28308 __ret = (int32x4_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, 
__p1, 34); \ 28309 __ret; \ 28310 }) 28311 #else 28312 #define vshrq_n_s32(__p0, __p1) __extension__ ({ \ 28313 int32x4_t __ret; \ 28314 int32x4_t __s0 = __p0; \ 28315 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28316 __ret = (int32x4_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 34); \ 28317 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28318 __ret; \ 28319 }) 28320 #endif 28321 28322 #ifdef __LITTLE_ENDIAN__ 28323 #define vshrq_n_s64(__p0, __p1) __extension__ ({ \ 28324 int64x2_t __ret; \ 28325 int64x2_t __s0 = __p0; \ 28326 __ret = (int64x2_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 35); \ 28327 __ret; \ 28328 }) 28329 #else 28330 #define vshrq_n_s64(__p0, __p1) __extension__ ({ \ 28331 int64x2_t __ret; \ 28332 int64x2_t __s0 = __p0; \ 28333 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28334 __ret = (int64x2_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 35); \ 28335 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28336 __ret; \ 28337 }) 28338 #endif 28339 28340 #ifdef __LITTLE_ENDIAN__ 28341 #define vshrq_n_s16(__p0, __p1) __extension__ ({ \ 28342 int16x8_t __ret; \ 28343 int16x8_t __s0 = __p0; \ 28344 __ret = (int16x8_t) __builtin_neon_vshrq_n_v((int8x16_t)__s0, __p1, 33); \ 28345 __ret; \ 28346 }) 28347 #else 28348 #define vshrq_n_s16(__p0, __p1) __extension__ ({ \ 28349 int16x8_t __ret; \ 28350 int16x8_t __s0 = __p0; \ 28351 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28352 __ret = (int16x8_t) __builtin_neon_vshrq_n_v((int8x16_t)__rev0, __p1, 33); \ 28353 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28354 __ret; \ 28355 }) 28356 #endif 28357 28358 #ifdef __LITTLE_ENDIAN__ 28359 #define vshr_n_u8(__p0, __p1) __extension__ ({ \ 28360 uint8x8_t __ret; \ 28361 uint8x8_t __s0 = __p0; \ 28362 __ret = (uint8x8_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 16); \ 28363 __ret; \ 28364 }) 
28365 #else 28366 #define vshr_n_u8(__p0, __p1) __extension__ ({ \ 28367 uint8x8_t __ret; \ 28368 uint8x8_t __s0 = __p0; \ 28369 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28370 __ret = (uint8x8_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 16); \ 28371 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28372 __ret; \ 28373 }) 28374 #endif 28375 28376 #ifdef __LITTLE_ENDIAN__ 28377 #define vshr_n_u32(__p0, __p1) __extension__ ({ \ 28378 uint32x2_t __ret; \ 28379 uint32x2_t __s0 = __p0; \ 28380 __ret = (uint32x2_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 18); \ 28381 __ret; \ 28382 }) 28383 #else 28384 #define vshr_n_u32(__p0, __p1) __extension__ ({ \ 28385 uint32x2_t __ret; \ 28386 uint32x2_t __s0 = __p0; \ 28387 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28388 __ret = (uint32x2_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 18); \ 28389 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28390 __ret; \ 28391 }) 28392 #endif 28393 28394 #define vshr_n_u64(__p0, __p1) __extension__ ({ \ 28395 uint64x1_t __ret; \ 28396 uint64x1_t __s0 = __p0; \ 28397 __ret = (uint64x1_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 19); \ 28398 __ret; \ 28399 }) 28400 #ifdef __LITTLE_ENDIAN__ 28401 #define vshr_n_u16(__p0, __p1) __extension__ ({ \ 28402 uint16x4_t __ret; \ 28403 uint16x4_t __s0 = __p0; \ 28404 __ret = (uint16x4_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 17); \ 28405 __ret; \ 28406 }) 28407 #else 28408 #define vshr_n_u16(__p0, __p1) __extension__ ({ \ 28409 uint16x4_t __ret; \ 28410 uint16x4_t __s0 = __p0; \ 28411 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28412 __ret = (uint16x4_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 17); \ 28413 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28414 __ret; \ 28415 }) 28416 #endif 28417 28418 #ifdef __LITTLE_ENDIAN__ 28419 #define vshr_n_s8(__p0, __p1) 
__extension__ ({ \ 28420 int8x8_t __ret; \ 28421 int8x8_t __s0 = __p0; \ 28422 __ret = (int8x8_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 0); \ 28423 __ret; \ 28424 }) 28425 #else 28426 #define vshr_n_s8(__p0, __p1) __extension__ ({ \ 28427 int8x8_t __ret; \ 28428 int8x8_t __s0 = __p0; \ 28429 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28430 __ret = (int8x8_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 0); \ 28431 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28432 __ret; \ 28433 }) 28434 #endif 28435 28436 /* vshr_n_s32: copies __p0 into a typed local and forwards it, cast to int8x8_t, with the immediate __p1 and the integer code 2 to __builtin_neon_vshr_n_v, casting the result back to int32x2_t. The #else (big-endian) branch reverses the two lanes with __builtin_shufflevector before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28437 #define vshr_n_s32(__p0, __p1) __extension__ ({ \ 28438 int32x2_t __ret; \ 28439 int32x2_t __s0 = __p0; \ 28440 __ret = (int32x2_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 2); \ 28441 __ret; \ 28442 }) 28443 #else 28444 #define vshr_n_s32(__p0, __p1) __extension__ ({ \ 28445 int32x2_t __ret; \ 28446 int32x2_t __s0 = __p0; \ 28447 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28448 __ret = (int32x2_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 2); \ 28449 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28450 __ret; \ 28451 }) 28452 #endif 28453 28454 /* vshr_n_s64: one-lane vector (int64x1_t); a single definition with no endian split and no lane reversal, code 3. */ #define vshr_n_s64(__p0, __p1) __extension__ ({ \ 28455 int64x1_t __ret; \ 28456 int64x1_t __s0 = __p0; \ 28457 __ret = (int64x1_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 3); \ 28458 __ret; \ 28459 }) 28460 /* vshr_n_s16: four-lane variant with code 1; the end of its big-endian branch is on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28461 #define vshr_n_s16(__p0, __p1) __extension__ ({ \ 28462 int16x4_t __ret; \ 28463 int16x4_t __s0 = __p0; \ 28464 __ret = (int16x4_t) __builtin_neon_vshr_n_v((int8x8_t)__s0, __p1, 1); \ 28465 __ret; \ 28466 }) 28467 #else 28468 #define vshr_n_s16(__p0, __p1) __extension__ ({ \ 28469 int16x4_t __ret; \ 28470 int16x4_t __s0 = __p0; \ 28471 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28472 __ret = (int16x4_t) __builtin_neon_vshr_n_v((int8x8_t)__rev0, __p1, 1); \ 28473 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28474 __ret; \ 28475 }) 28476 #endif 28477 28478 /* vshrn_n_u32: takes a uint32x4_t in __p0 and an immediate __p1, calls __builtin_neon_vshrn_n_v on the input cast to int8x16_t with code 17, and yields a uint16x4_t. The #else (big-endian) branch reverses the four lanes before the call and reverses the result afterwards; it also defines __noswap_vshrn_n_u32, which performs the same call with no lane reversal. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28479 #define vshrn_n_u32(__p0, __p1) __extension__ ({ \ 28480 uint16x4_t __ret; \ 28481 uint32x4_t __s0 = __p0; \ 28482 __ret = (uint16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 17); \ 28483 __ret; \ 28484 }) 28485 #else 28486 #define vshrn_n_u32(__p0, __p1) __extension__ ({ \ 28487 uint16x4_t __ret; \ 28488 uint32x4_t __s0 = __p0; \ 28489 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28490 __ret = (uint16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 17); \ 28491 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28492 __ret; \ 28493 }) 28494 #define __noswap_vshrn_n_u32(__p0, __p1) __extension__ ({ \ 28495 uint16x4_t __ret; \ 28496 uint32x4_t __s0 = __p0; \ 28497 __ret = (uint16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 17); \ 28498 __ret; \ 28499 }) 28500 #endif 28501 28502 /* vshrn_n_u64: same shape as vshrn_n_u32 for a uint64x2_t input and uint32x2_t result (two lanes, code 18), including a big-endian-only __noswap_ form. */ #ifdef __LITTLE_ENDIAN__ 28503 #define vshrn_n_u64(__p0, __p1) __extension__ ({ \ 28504 uint32x2_t __ret; \ 28505 uint64x2_t __s0 = __p0; \ 28506 __ret = (uint32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 18); \ 28507 __ret; \ 28508 }) 28509 #else 28510 #define vshrn_n_u64(__p0, __p1) __extension__ ({ \ 28511 uint32x2_t __ret; \ 28512 uint64x2_t __s0 = __p0; \ 28513 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28514 __ret = (uint32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 18); \ 28515 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28516 __ret; \ 28517 }) 28518 #define __noswap_vshrn_n_u64(__p0, __p1) __extension__ ({ \ 28519 uint32x2_t __ret; \ 28520 uint64x2_t __s0 = __p0; \ 28521 __ret = (uint32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 18); \ 28522 __ret; \ 28523 }) 28524 #endif 28525 28526 /* vshrn_n_u16: uint16x8_t input, uint8x8_t result; the definition continues on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28527 #define vshrn_n_u16(__p0, __p1) __extension__ ({ \ 28528 uint8x8_t __ret; \ 28529 uint16x8_t __s0 = 
__p0; \ 28530 __ret = (uint8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 16); \ 28531 __ret; \ 28532 }) 28533 #else 28534 #define vshrn_n_u16(__p0, __p1) __extension__ ({ \ 28535 uint8x8_t __ret; \ 28536 uint16x8_t __s0 = __p0; \ 28537 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28538 __ret = (uint8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 16); \ 28539 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28540 __ret; \ 28541 }) 28542 #define __noswap_vshrn_n_u16(__p0, __p1) __extension__ ({ \ 28543 uint8x8_t __ret; \ 28544 uint16x8_t __s0 = __p0; \ 28545 __ret = (uint8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 16); \ 28546 __ret; \ 28547 }) 28548 #endif 28549 28550 /* vshrn_n_s32: takes an int32x4_t in __p0 and an immediate __p1, calls __builtin_neon_vshrn_n_v on the input cast to int8x16_t with code 1, and yields an int16x4_t. The #else (big-endian) branch reverses the four lanes before the call and reverses the result afterwards; it also defines __noswap_vshrn_n_s32, which performs the same call with no lane reversal. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28551 #define vshrn_n_s32(__p0, __p1) __extension__ ({ \ 28552 int16x4_t __ret; \ 28553 int32x4_t __s0 = __p0; \ 28554 __ret = (int16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 1); \ 28555 __ret; \ 28556 }) 28557 #else 28558 #define vshrn_n_s32(__p0, __p1) __extension__ ({ \ 28559 int16x4_t __ret; \ 28560 int32x4_t __s0 = __p0; \ 28561 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28562 __ret = (int16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 1); \ 28563 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28564 __ret; \ 28565 }) 28566 #define __noswap_vshrn_n_s32(__p0, __p1) __extension__ ({ \ 28567 int16x4_t __ret; \ 28568 int32x4_t __s0 = __p0; \ 28569 __ret = (int16x4_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 1); \ 28570 __ret; \ 28571 }) 28572 #endif 28573 28574 /* vshrn_n_s64: int64x2_t input, int32x2_t result, code 2; the big-endian branch continues on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28575 #define vshrn_n_s64(__p0, __p1) __extension__ ({ \ 28576 int32x2_t __ret; \ 28577 int64x2_t __s0 = __p0; \ 28578 __ret = (int32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 2); \ 28579 __ret; \ 28580 }) 28581 #else 28582 #define vshrn_n_s64(__p0, __p1) __extension__ ({ \ 28583 int32x2_t __ret; \ 28584 
int64x2_t __s0 = __p0; \ 28585 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28586 __ret = (int32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 2); \ 28587 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28588 __ret; \ 28589 }) 28590 #define __noswap_vshrn_n_s64(__p0, __p1) __extension__ ({ \ 28591 int32x2_t __ret; \ 28592 int64x2_t __s0 = __p0; \ 28593 __ret = (int32x2_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 2); \ 28594 __ret; \ 28595 }) 28596 #endif 28597 28598 /* vshrn_n_s16: takes an int16x8_t in __p0 and an immediate __p1, calls __builtin_neon_vshrn_n_v on the input cast to int8x16_t with code 0, and yields an int8x8_t. The #else (big-endian) branch reverses the eight lanes before the call and reverses the result afterwards; it also defines __noswap_vshrn_n_s16, which performs the same call with no lane reversal. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28599 #define vshrn_n_s16(__p0, __p1) __extension__ ({ \ 28600 int8x8_t __ret; \ 28601 int16x8_t __s0 = __p0; \ 28602 __ret = (int8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 0); \ 28603 __ret; \ 28604 }) 28605 #else 28606 #define vshrn_n_s16(__p0, __p1) __extension__ ({ \ 28607 int8x8_t __ret; \ 28608 int16x8_t __s0 = __p0; \ 28609 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28610 __ret = (int8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__rev0, __p1, 0); \ 28611 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28612 __ret; \ 28613 }) 28614 #define __noswap_vshrn_n_s16(__p0, __p1) __extension__ ({ \ 28615 int8x8_t __ret; \ 28616 int16x8_t __s0 = __p0; \ 28617 __ret = (int8x8_t) __builtin_neon_vshrn_n_v((int8x16_t)__s0, __p1, 0); \ 28618 __ret; \ 28619 }) 28620 #endif 28621 28622 /* vsli_n_p8: two poly8x8_t operands (__p0, __p1) plus an immediate __p2, forwarded to __builtin_neon_vsli_n_v with code 4; in the big-endian branch both operands are lane-reversed before the call. The definition continues on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28623 #define vsli_n_p8(__p0, __p1, __p2) __extension__ ({ \ 28624 poly8x8_t __ret; \ 28625 poly8x8_t __s0 = __p0; \ 28626 poly8x8_t __s1 = __p1; \ 28627 __ret = (poly8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 4); \ 28628 __ret; \ 28629 }) 28630 #else 28631 #define vsli_n_p8(__p0, __p1, __p2) __extension__ ({ \ 28632 poly8x8_t __ret; \ 28633 poly8x8_t __s0 = __p0; \ 28634 poly8x8_t __s1 = __p1; \ 28635 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28636 poly8x8_t __rev1; __rev1 = 
__builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 28637 __ret = (poly8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 4); \ 28638 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28639 __ret; \ 28640 }) 28641 #endif 28642 28643 /* vsli_n_p16: copies the two poly16x4_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x8_t, with the immediate __p2 and the integer code 5 to __builtin_neon_vsli_n_v; the result is cast back to poly16x4_t. The #else (big-endian) branch reverses the four lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28644 #define vsli_n_p16(__p0, __p1, __p2) __extension__ ({ \ 28645 poly16x4_t __ret; \ 28646 poly16x4_t __s0 = __p0; \ 28647 poly16x4_t __s1 = __p1; \ 28648 __ret = (poly16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 5); \ 28649 __ret; \ 28650 }) 28651 #else 28652 #define vsli_n_p16(__p0, __p1, __p2) __extension__ ({ \ 28653 poly16x4_t __ret; \ 28654 poly16x4_t __s0 = __p0; \ 28655 poly16x4_t __s1 = __p1; \ 28656 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28657 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 28658 __ret = (poly16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 5); \ 28659 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28660 __ret; \ 28661 }) 28662 #endif 28663 28664 /* vsliq_n_p8: poly8x16_t form; operands are cast to int8x16_t and passed to __builtin_neon_vsliq_n_v with code 36. The big-endian branch reverses all sixteen lanes; its final shuffle continues on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28665 #define vsliq_n_p8(__p0, __p1, __p2) __extension__ ({ \ 28666 poly8x16_t __ret; \ 28667 poly8x16_t __s0 = __p0; \ 28668 poly8x16_t __s1 = __p1; \ 28669 __ret = (poly8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \ 28670 __ret; \ 28671 }) 28672 #else 28673 #define vsliq_n_p8(__p0, __p1, __p2) __extension__ ({ \ 28674 poly8x16_t __ret; \ 28675 poly8x16_t __s0 = __p0; \ 28676 poly8x16_t __s1 = __p1; \ 28677 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28678 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28679 __ret = (poly8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \ 28680 __ret = __builtin_shufflevector(__ret, 
__ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28681 __ret; \ 28682 }) 28683 #endif 28684 28685 /* vsliq_n_p16: copies the two poly16x8_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x16_t, with the immediate __p2 and the integer code 37 to __builtin_neon_vsliq_n_v; the result is cast back to poly16x8_t. The #else (big-endian) branch reverses the eight lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28686 #define vsliq_n_p16(__p0, __p1, __p2) __extension__ ({ \ 28687 poly16x8_t __ret; \ 28688 poly16x8_t __s0 = __p0; \ 28689 poly16x8_t __s1 = __p1; \ 28690 __ret = (poly16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 37); \ 28691 __ret; \ 28692 }) 28693 #else 28694 #define vsliq_n_p16(__p0, __p1, __p2) __extension__ ({ \ 28695 poly16x8_t __ret; \ 28696 poly16x8_t __s0 = __p0; \ 28697 poly16x8_t __s1 = __p1; \ 28698 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28699 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 28700 __ret = (poly16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 37); \ 28701 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28702 __ret; \ 28703 }) 28704 #endif 28705 28706 /* vsliq_n_u8: same two-branch pattern for uint8x16_t operands, sixteen lanes, code 48. */ #ifdef __LITTLE_ENDIAN__ 28707 #define vsliq_n_u8(__p0, __p1, __p2) __extension__ ({ \ 28708 uint8x16_t __ret; \ 28709 uint8x16_t __s0 = __p0; \ 28710 uint8x16_t __s1 = __p1; \ 28711 __ret = (uint8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \ 28712 __ret; \ 28713 }) 28714 #else 28715 #define vsliq_n_u8(__p0, __p1, __p2) __extension__ ({ \ 28716 uint8x16_t __ret; \ 28717 uint8x16_t __s0 = __p0; \ 28718 uint8x16_t __s1 = __p1; \ 28719 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28720 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28721 __ret = (uint8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \ 28722 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28723 __ret; \ 28724 }) 28725 #endif 28726 28727 #ifdef 
__LITTLE_ENDIAN__ 28728 /* vsliq_n_u32: copies the two uint32x4_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x16_t, with the immediate __p2 and the integer code 50 to __builtin_neon_vsliq_n_v; the result is cast back to uint32x4_t. The #else (big-endian) branch reverses the four lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #define vsliq_n_u32(__p0, __p1, __p2) __extension__ ({ \ 28729 uint32x4_t __ret; \ 28730 uint32x4_t __s0 = __p0; \ 28731 uint32x4_t __s1 = __p1; \ 28732 __ret = (uint32x4_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \ 28733 __ret; \ 28734 }) 28735 #else 28736 #define vsliq_n_u32(__p0, __p1, __p2) __extension__ ({ \ 28737 uint32x4_t __ret; \ 28738 uint32x4_t __s0 = __p0; \ 28739 uint32x4_t __s1 = __p1; \ 28740 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28741 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 28742 __ret = (uint32x4_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \ 28743 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28744 __ret; \ 28745 }) 28746 #endif 28747 28748 /* vsliq_n_u64: same two-branch pattern for uint64x2_t operands, two lanes, code 51. */ #ifdef __LITTLE_ENDIAN__ 28749 #define vsliq_n_u64(__p0, __p1, __p2) __extension__ ({ \ 28750 uint64x2_t __ret; \ 28751 uint64x2_t __s0 = __p0; \ 28752 uint64x2_t __s1 = __p1; \ 28753 __ret = (uint64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \ 28754 __ret; \ 28755 }) 28756 #else 28757 #define vsliq_n_u64(__p0, __p1, __p2) __extension__ ({ \ 28758 uint64x2_t __ret; \ 28759 uint64x2_t __s0 = __p0; \ 28760 uint64x2_t __s1 = __p1; \ 28761 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28762 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 28763 __ret = (uint64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \ 28764 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28765 __ret; \ 28766 }) 28767 #endif 28768 28769 /* vsliq_n_u16: little-endian branch for uint16x8_t operands, code 49; the big-endian branch is on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28770 #define vsliq_n_u16(__p0, __p1, __p2) __extension__ ({ \ 28771 uint16x8_t __ret; \ 28772 uint16x8_t __s0 = __p0; \ 28773 uint16x8_t __s1 = __p1; \ 28774 __ret = (uint16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \ 28775 __ret; \ 28776 }) 28777 #else 
28778 #define vsliq_n_u16(__p0, __p1, __p2) __extension__ ({ \ 28779 uint16x8_t __ret; \ 28780 uint16x8_t __s0 = __p0; \ 28781 uint16x8_t __s1 = __p1; \ 28782 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28783 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 28784 __ret = (uint16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \ 28785 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28786 __ret; \ 28787 }) 28788 #endif 28789 28790 /* vsliq_n_s8: copies the two int8x16_t operands __p0 and __p1 into typed locals and forwards them with the immediate __p2 and the integer code 32 to __builtin_neon_vsliq_n_v. The #else (big-endian) branch reverses the sixteen lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28791 #define vsliq_n_s8(__p0, __p1, __p2) __extension__ ({ \ 28792 int8x16_t __ret; \ 28793 int8x16_t __s0 = __p0; \ 28794 int8x16_t __s1 = __p1; \ 28795 __ret = (int8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \ 28796 __ret; \ 28797 }) 28798 #else 28799 #define vsliq_n_s8(__p0, __p1, __p2) __extension__ ({ \ 28800 int8x16_t __ret; \ 28801 int8x16_t __s0 = __p0; \ 28802 int8x16_t __s1 = __p1; \ 28803 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28804 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28805 __ret = (int8x16_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \ 28806 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 28807 __ret; \ 28808 }) 28809 #endif 28810 28811 /* vsliq_n_s32: int32x4_t operands, four lanes, code 34; the big-endian branch continues on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28812 #define vsliq_n_s32(__p0, __p1, __p2) __extension__ ({ \ 28813 int32x4_t __ret; \ 28814 int32x4_t __s0 = __p0; \ 28815 int32x4_t __s1 = __p1; \ 28816 __ret = (int32x4_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \ 28817 __ret; \ 28818 }) 28819 #else 28820 #define vsliq_n_s32(__p0, __p1, __p2) __extension__ ({ \ 28821 int32x4_t __ret; \ 28822 int32x4_t __s0 = __p0; \ 28823 int32x4_t __s1 = 
__p1; \ 28824 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28825 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 28826 __ret = (int32x4_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \ 28827 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28828 __ret; \ 28829 }) 28830 #endif 28831 28832 /* vsliq_n_s64: copies the two int64x2_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x16_t, with the immediate __p2 and the integer code 35 to __builtin_neon_vsliq_n_v; the result is cast back to int64x2_t. The #else (big-endian) branch reverses the two lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28833 #define vsliq_n_s64(__p0, __p1, __p2) __extension__ ({ \ 28834 int64x2_t __ret; \ 28835 int64x2_t __s0 = __p0; \ 28836 int64x2_t __s1 = __p1; \ 28837 __ret = (int64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \ 28838 __ret; \ 28839 }) 28840 #else 28841 #define vsliq_n_s64(__p0, __p1, __p2) __extension__ ({ \ 28842 int64x2_t __ret; \ 28843 int64x2_t __s0 = __p0; \ 28844 int64x2_t __s1 = __p1; \ 28845 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28846 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 28847 __ret = (int64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \ 28848 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28849 __ret; \ 28850 }) 28851 #endif 28852 28853 /* vsliq_n_s16: int16x8_t operands, eight lanes, code 33; the final shuffle of the big-endian branch is on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28854 #define vsliq_n_s16(__p0, __p1, __p2) __extension__ ({ \ 28855 int16x8_t __ret; \ 28856 int16x8_t __s0 = __p0; \ 28857 int16x8_t __s1 = __p1; \ 28858 __ret = (int16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \ 28859 __ret; \ 28860 }) 28861 #else 28862 #define vsliq_n_s16(__p0, __p1, __p2) __extension__ ({ \ 28863 int16x8_t __ret; \ 28864 int16x8_t __s0 = __p0; \ 28865 int16x8_t __s1 = __p1; \ 28866 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28867 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 28868 __ret = (int16x8_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 28869 __ret = 
__builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28870 __ret; \ 28871 }) 28872 #endif 28873 28874 /* vsli_n_u8: copies the two uint8x8_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x8_t, with the immediate __p2 and the integer code 16 to __builtin_neon_vsli_n_v; the result is cast back to uint8x8_t. The #else (big-endian) branch reverses the eight lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28875 #define vsli_n_u8(__p0, __p1, __p2) __extension__ ({ \ 28876 uint8x8_t __ret; \ 28877 uint8x8_t __s0 = __p0; \ 28878 uint8x8_t __s1 = __p1; \ 28879 __ret = (uint8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 16); \ 28880 __ret; \ 28881 }) 28882 #else 28883 #define vsli_n_u8(__p0, __p1, __p2) __extension__ ({ \ 28884 uint8x8_t __ret; \ 28885 uint8x8_t __s0 = __p0; \ 28886 uint8x8_t __s1 = __p1; \ 28887 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28888 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 28889 __ret = (uint8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \ 28890 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28891 __ret; \ 28892 }) 28893 #endif 28894 28895 /* vsli_n_u32: same two-branch pattern for uint32x2_t operands, two lanes, code 18. */ #ifdef __LITTLE_ENDIAN__ 28896 #define vsli_n_u32(__p0, __p1, __p2) __extension__ ({ \ 28897 uint32x2_t __ret; \ 28898 uint32x2_t __s0 = __p0; \ 28899 uint32x2_t __s1 = __p1; \ 28900 __ret = (uint32x2_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \ 28901 __ret; \ 28902 }) 28903 #else 28904 #define vsli_n_u32(__p0, __p1, __p2) __extension__ ({ \ 28905 uint32x2_t __ret; \ 28906 uint32x2_t __s0 = __p0; \ 28907 uint32x2_t __s1 = __p1; \ 28908 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28909 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 28910 __ret = (uint32x2_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \ 28911 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28912 __ret; \ 28913 }) 28914 #endif 28915 28916 /* vsli_n_u64: one-lane vector (uint64x1_t), single definition with no endian split; the builtin call continues on the next physical line. */ #define vsli_n_u64(__p0, __p1, __p2) __extension__ ({ \ 28917 uint64x1_t __ret; \ 28918 uint64x1_t __s0 = __p0; \ 28919 uint64x1_t __s1 = __p1; \ 28920 __ret = (uint64x1_t) 
__builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \ 28921 __ret; \ 28922 }) 28923 /* vsli_n_u16: copies the two uint16x4_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x8_t, with the immediate __p2 and the integer code 17 to __builtin_neon_vsli_n_v; the result is cast back to uint16x4_t. The #else (big-endian) branch reverses the four lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 28924 #define vsli_n_u16(__p0, __p1, __p2) __extension__ ({ \ 28925 uint16x4_t __ret; \ 28926 uint16x4_t __s0 = __p0; \ 28927 uint16x4_t __s1 = __p1; \ 28928 __ret = (uint16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \ 28929 __ret; \ 28930 }) 28931 #else 28932 #define vsli_n_u16(__p0, __p1, __p2) __extension__ ({ \ 28933 uint16x4_t __ret; \ 28934 uint16x4_t __s0 = __p0; \ 28935 uint16x4_t __s1 = __p1; \ 28936 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 28937 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 28938 __ret = (uint16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \ 28939 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 28940 __ret; \ 28941 }) 28942 #endif 28943 28944 /* vsli_n_s8: same two-branch pattern for int8x8_t operands, eight lanes, code 0. */ #ifdef __LITTLE_ENDIAN__ 28945 #define vsli_n_s8(__p0, __p1, __p2) __extension__ ({ \ 28946 int8x8_t __ret; \ 28947 int8x8_t __s0 = __p0; \ 28948 int8x8_t __s1 = __p1; \ 28949 __ret = (int8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \ 28950 __ret; \ 28951 }) 28952 #else 28953 #define vsli_n_s8(__p0, __p1, __p2) __extension__ ({ \ 28954 int8x8_t __ret; \ 28955 int8x8_t __s0 = __p0; \ 28956 int8x8_t __s1 = __p1; \ 28957 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 28958 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 28959 __ret = (int8x8_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \ 28960 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 28961 __ret; \ 28962 }) 28963 #endif 28964 28965 /* vsli_n_s32: int32x2_t operands, two lanes, code 2; the definition continues on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 28966 #define vsli_n_s32(__p0, __p1, __p2) __extension__ ({ \ 28967 int32x2_t __ret; \ 28968 int32x2_t __s0 = __p0; \ 28969 int32x2_t __s1 = __p1; \ 28970 __ret = 
(int32x2_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \ 28971 __ret; \ 28972 }) 28973 #else 28974 #define vsli_n_s32(__p0, __p1, __p2) __extension__ ({ \ 28975 int32x2_t __ret; \ 28976 int32x2_t __s0 = __p0; \ 28977 int32x2_t __s1 = __p1; \ 28978 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 28979 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 28980 __ret = (int32x2_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 28981 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 28982 __ret; \ 28983 }) 28984 #endif 28985 28986 /* vsli_n_s64: one-lane vector (int64x1_t); a single definition with no endian split and no lane reversal. Both operands are copied into typed locals, cast to int8x8_t and passed with the immediate __p2 and the integer code 3 to __builtin_neon_vsli_n_v. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #define vsli_n_s64(__p0, __p1, __p2) __extension__ ({ \ 28987 int64x1_t __ret; \ 28988 int64x1_t __s0 = __p0; \ 28989 int64x1_t __s1 = __p1; \ 28990 __ret = (int64x1_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \ 28991 __ret; \ 28992 }) 28993 /* vsli_n_s16: int16x4_t operands, code 1; the #else (big-endian) branch reverses the four lanes of both operands before the call and reverses the result afterwards. */ #ifdef __LITTLE_ENDIAN__ 28994 #define vsli_n_s16(__p0, __p1, __p2) __extension__ ({ \ 28995 int16x4_t __ret; \ 28996 int16x4_t __s0 = __p0; \ 28997 int16x4_t __s1 = __p1; \ 28998 __ret = (int16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \ 28999 __ret; \ 29000 }) 29001 #else 29002 #define vsli_n_s16(__p0, __p1, __p2) __extension__ ({ \ 29003 int16x4_t __ret; \ 29004 int16x4_t __s0 = __p0; \ 29005 int16x4_t __s1 = __p1; \ 29006 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29007 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29008 __ret = (int16x4_t) __builtin_neon_vsli_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 29009 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29010 __ret; \ 29011 }) 29012 #endif 29013 29014 /* vsraq_n_u8: uint8x16_t operands passed to __builtin_neon_vsraq_n_v; the end of the builtin call (its integer code) is on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 29015 #define vsraq_n_u8(__p0, __p1, __p2) __extension__ ({ \ 29016 uint8x16_t __ret; \ 29017 uint8x16_t __s0 = __p0; \ 29018 uint8x16_t __s1 = __p1; \ 29019 __ret = (uint8x16_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 
48); \ 29020 __ret; \ 29021 }) 29022 #else 29023 #define vsraq_n_u8(__p0, __p1, __p2) __extension__ ({ \ 29024 uint8x16_t __ret; \ 29025 uint8x16_t __s0 = __p0; \ 29026 uint8x16_t __s1 = __p1; \ 29027 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29028 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29029 __ret = (uint8x16_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \ 29030 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29031 __ret; \ 29032 }) 29033 #endif 29034 29035 /* vsraq_n_u32: copies the two uint32x4_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x16_t, with the immediate __p2 and the integer code 50 to __builtin_neon_vsraq_n_v; the result is cast back to uint32x4_t. The #else (big-endian) branch reverses the four lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 29036 #define vsraq_n_u32(__p0, __p1, __p2) __extension__ ({ \ 29037 uint32x4_t __ret; \ 29038 uint32x4_t __s0 = __p0; \ 29039 uint32x4_t __s1 = __p1; \ 29040 __ret = (uint32x4_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \ 29041 __ret; \ 29042 }) 29043 #else 29044 #define vsraq_n_u32(__p0, __p1, __p2) __extension__ ({ \ 29045 uint32x4_t __ret; \ 29046 uint32x4_t __s0 = __p0; \ 29047 uint32x4_t __s1 = __p1; \ 29048 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29049 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29050 __ret = (uint32x4_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \ 29051 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29052 __ret; \ 29053 }) 29054 #endif 29055 29056 /* vsraq_n_u64: uint64x2_t operands, two lanes, code 51; the big-endian branch continues on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 29057 #define vsraq_n_u64(__p0, __p1, __p2) __extension__ ({ \ 29058 uint64x2_t __ret; \ 29059 uint64x2_t __s0 = __p0; \ 29060 uint64x2_t __s1 = __p1; \ 29061 __ret = (uint64x2_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \ 29062 __ret; \ 29063 }) 29064 #else 29065 #define vsraq_n_u64(__p0, __p1, __p2) __extension__ ({ \ 29066 uint64x2_t __ret; \ 29067 uint64x2_t __s0 = __p0; \ 
29068 uint64x2_t __s1 = __p1; \ 29069 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 29070 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29071 __ret = (uint64x2_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \ 29072 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 29073 __ret; \ 29074 }) 29075 #endif 29076 29077 /* vsraq_n_u16: copies the two uint16x8_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x16_t, with the immediate __p2 and the integer code 49 to __builtin_neon_vsraq_n_v; the result is cast back to uint16x8_t. The #else (big-endian) branch reverses the eight lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 29078 #define vsraq_n_u16(__p0, __p1, __p2) __extension__ ({ \ 29079 uint16x8_t __ret; \ 29080 uint16x8_t __s0 = __p0; \ 29081 uint16x8_t __s1 = __p1; \ 29082 __ret = (uint16x8_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \ 29083 __ret; \ 29084 }) 29085 #else 29086 #define vsraq_n_u16(__p0, __p1, __p2) __extension__ ({ \ 29087 uint16x8_t __ret; \ 29088 uint16x8_t __s0 = __p0; \ 29089 uint16x8_t __s1 = __p1; \ 29090 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29091 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29092 __ret = (uint16x8_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \ 29093 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29094 __ret; \ 29095 }) 29096 #endif 29097 29098 /* vsraq_n_s8: int8x16_t operands, sixteen lanes, code 32; the big-endian branch continues on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 29099 #define vsraq_n_s8(__p0, __p1, __p2) __extension__ ({ \ 29100 int8x16_t __ret; \ 29101 int8x16_t __s0 = __p0; \ 29102 int8x16_t __s1 = __p1; \ 29103 __ret = (int8x16_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \ 29104 __ret; \ 29105 }) 29106 #else 29107 #define vsraq_n_s8(__p0, __p1, __p2) __extension__ ({ \ 29108 int8x16_t __ret; \ 29109 int8x16_t __s0 = __p0; \ 29110 int8x16_t __s1 = __p1; \ 29111 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29112 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 
0); \ 29113 __ret = (int8x16_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \ 29114 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29115 __ret; \ 29116 }) 29117 #endif 29118 29119 /* vsraq_n_s32: copies the two int32x4_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x16_t, with the immediate __p2 and the integer code 34 to __builtin_neon_vsraq_n_v; the result is cast back to int32x4_t. The #else (big-endian) branch reverses the four lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 29120 #define vsraq_n_s32(__p0, __p1, __p2) __extension__ ({ \ 29121 int32x4_t __ret; \ 29122 int32x4_t __s0 = __p0; \ 29123 int32x4_t __s1 = __p1; \ 29124 __ret = (int32x4_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \ 29125 __ret; \ 29126 }) 29127 #else 29128 #define vsraq_n_s32(__p0, __p1, __p2) __extension__ ({ \ 29129 int32x4_t __ret; \ 29130 int32x4_t __s0 = __p0; \ 29131 int32x4_t __s1 = __p1; \ 29132 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29133 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29134 __ret = (int32x4_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \ 29135 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29136 __ret; \ 29137 }) 29138 #endif 29139 29140 /* vsraq_n_s64: same two-branch pattern for int64x2_t operands, two lanes, code 35. */ #ifdef __LITTLE_ENDIAN__ 29141 #define vsraq_n_s64(__p0, __p1, __p2) __extension__ ({ \ 29142 int64x2_t __ret; \ 29143 int64x2_t __s0 = __p0; \ 29144 int64x2_t __s1 = __p1; \ 29145 __ret = (int64x2_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \ 29146 __ret; \ 29147 }) 29148 #else 29149 #define vsraq_n_s64(__p0, __p1, __p2) __extension__ ({ \ 29150 int64x2_t __ret; \ 29151 int64x2_t __s0 = __p0; \ 29152 int64x2_t __s1 = __p1; \ 29153 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 29154 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29155 __ret = (int64x2_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \ 29156 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 29157 __ret; \ 29158 }) 29159 #endif 29160 29161 /* vsraq_n_s16: int16x8_t operands; the parameter list and body continue on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 29162 #define vsraq_n_s16(__p0, 
__p1, __p2) __extension__ ({ \ 29163 int16x8_t __ret; \ 29164 int16x8_t __s0 = __p0; \ 29165 int16x8_t __s1 = __p1; \ 29166 __ret = (int16x8_t) __builtin_neon_vsraq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \ 29167 __ret; \ 29168 }) 29169 #else 29170 #define vsraq_n_s16(__p0, __p1, __p2) __extension__ ({ \ 29171 int16x8_t __ret; \ 29172 int16x8_t __s0 = __p0; \ 29173 int16x8_t __s1 = __p1; \ 29174 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29175 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29176 __ret = (int16x8_t) __builtin_neon_vsraq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 29177 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29178 __ret; \ 29179 }) 29180 #endif 29181 29182 /* vsra_n_u8: copies the two uint8x8_t operands __p0 and __p1 into typed locals and forwards them, cast to int8x8_t, with the immediate __p2 and the integer code 16 to __builtin_neon_vsra_n_v; the result is cast back to uint8x8_t. The #else (big-endian) branch reverses the eight lanes of both operands before the call and reverses the result afterwards. NOTE(review): the trailing integer presumably selects the element type for the type-generic builtin - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 29183 #define vsra_n_u8(__p0, __p1, __p2) __extension__ ({ \ 29184 uint8x8_t __ret; \ 29185 uint8x8_t __s0 = __p0; \ 29186 uint8x8_t __s1 = __p1; \ 29187 __ret = (uint8x8_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 16); \ 29188 __ret; \ 29189 }) 29190 #else 29191 #define vsra_n_u8(__p0, __p1, __p2) __extension__ ({ \ 29192 uint8x8_t __ret; \ 29193 uint8x8_t __s0 = __p0; \ 29194 uint8x8_t __s1 = __p1; \ 29195 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29196 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29197 __ret = (uint8x8_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \ 29198 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29199 __ret; \ 29200 }) 29201 #endif 29202 29203 /* vsra_n_u32: little-endian branch for uint32x2_t operands, code 18; the big-endian branch is on the next physical line. */ #ifdef __LITTLE_ENDIAN__ 29204 #define vsra_n_u32(__p0, __p1, __p2) __extension__ ({ \ 29205 uint32x2_t __ret; \ 29206 uint32x2_t __s0 = __p0; \ 29207 uint32x2_t __s1 = __p1; \ 29208 __ret = (uint32x2_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \ 29209 __ret; \ 29210 }) 29211 
#else 29212 #define vsra_n_u32(__p0, __p1, __p2) __extension__ ({ \ 29213 uint32x2_t __ret; \ 29214 uint32x2_t __s0 = __p0; \ 29215 uint32x2_t __s1 = __p1; \ 29216 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 29217 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29218 __ret = (uint32x2_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \ 29219 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 29220 __ret; \ 29221 }) 29222 #endif 29223 29224 #define vsra_n_u64(__p0, __p1, __p2) __extension__ ({ \ 29225 uint64x1_t __ret; \ 29226 uint64x1_t __s0 = __p0; \ 29227 uint64x1_t __s1 = __p1; \ 29228 __ret = (uint64x1_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \ 29229 __ret; \ 29230 }) 29231 #ifdef __LITTLE_ENDIAN__ 29232 #define vsra_n_u16(__p0, __p1, __p2) __extension__ ({ \ 29233 uint16x4_t __ret; \ 29234 uint16x4_t __s0 = __p0; \ 29235 uint16x4_t __s1 = __p1; \ 29236 __ret = (uint16x4_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \ 29237 __ret; \ 29238 }) 29239 #else 29240 #define vsra_n_u16(__p0, __p1, __p2) __extension__ ({ \ 29241 uint16x4_t __ret; \ 29242 uint16x4_t __s0 = __p0; \ 29243 uint16x4_t __s1 = __p1; \ 29244 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29245 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29246 __ret = (uint16x4_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \ 29247 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29248 __ret; \ 29249 }) 29250 #endif 29251 29252 #ifdef __LITTLE_ENDIAN__ 29253 #define vsra_n_s8(__p0, __p1, __p2) __extension__ ({ \ 29254 int8x8_t __ret; \ 29255 int8x8_t __s0 = __p0; \ 29256 int8x8_t __s1 = __p1; \ 29257 __ret = (int8x8_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \ 29258 __ret; \ 29259 }) 29260 #else 29261 #define vsra_n_s8(__p0, __p1, __p2) __extension__ 
({ \ 29262 int8x8_t __ret; \ 29263 int8x8_t __s0 = __p0; \ 29264 int8x8_t __s1 = __p1; \ 29265 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29266 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29267 __ret = (int8x8_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \ 29268 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29269 __ret; \ 29270 }) 29271 #endif 29272 29273 #ifdef __LITTLE_ENDIAN__ 29274 #define vsra_n_s32(__p0, __p1, __p2) __extension__ ({ \ 29275 int32x2_t __ret; \ 29276 int32x2_t __s0 = __p0; \ 29277 int32x2_t __s1 = __p1; \ 29278 __ret = (int32x2_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \ 29279 __ret; \ 29280 }) 29281 #else 29282 #define vsra_n_s32(__p0, __p1, __p2) __extension__ ({ \ 29283 int32x2_t __ret; \ 29284 int32x2_t __s0 = __p0; \ 29285 int32x2_t __s1 = __p1; \ 29286 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 29287 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29288 __ret = (int32x2_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 29289 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 29290 __ret; \ 29291 }) 29292 #endif 29293 29294 #define vsra_n_s64(__p0, __p1, __p2) __extension__ ({ \ 29295 int64x1_t __ret; \ 29296 int64x1_t __s0 = __p0; \ 29297 int64x1_t __s1 = __p1; \ 29298 __ret = (int64x1_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \ 29299 __ret; \ 29300 }) 29301 #ifdef __LITTLE_ENDIAN__ 29302 #define vsra_n_s16(__p0, __p1, __p2) __extension__ ({ \ 29303 int16x4_t __ret; \ 29304 int16x4_t __s0 = __p0; \ 29305 int16x4_t __s1 = __p1; \ 29306 __ret = (int16x4_t) __builtin_neon_vsra_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \ 29307 __ret; \ 29308 }) 29309 #else 29310 #define vsra_n_s16(__p0, __p1, __p2) __extension__ ({ \ 29311 int16x4_t __ret; \ 29312 int16x4_t __s0 
= __p0; \ 29313 int16x4_t __s1 = __p1; \ 29314 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29315 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29316 __ret = (int16x4_t) __builtin_neon_vsra_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 29317 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29318 __ret; \ 29319 }) 29320 #endif 29321 29322 #ifdef __LITTLE_ENDIAN__ 29323 #define vsri_n_p8(__p0, __p1, __p2) __extension__ ({ \ 29324 poly8x8_t __ret; \ 29325 poly8x8_t __s0 = __p0; \ 29326 poly8x8_t __s1 = __p1; \ 29327 __ret = (poly8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 4); \ 29328 __ret; \ 29329 }) 29330 #else 29331 #define vsri_n_p8(__p0, __p1, __p2) __extension__ ({ \ 29332 poly8x8_t __ret; \ 29333 poly8x8_t __s0 = __p0; \ 29334 poly8x8_t __s1 = __p1; \ 29335 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29336 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29337 __ret = (poly8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 4); \ 29338 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29339 __ret; \ 29340 }) 29341 #endif 29342 29343 #ifdef __LITTLE_ENDIAN__ 29344 #define vsri_n_p16(__p0, __p1, __p2) __extension__ ({ \ 29345 poly16x4_t __ret; \ 29346 poly16x4_t __s0 = __p0; \ 29347 poly16x4_t __s1 = __p1; \ 29348 __ret = (poly16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 5); \ 29349 __ret; \ 29350 }) 29351 #else 29352 #define vsri_n_p16(__p0, __p1, __p2) __extension__ ({ \ 29353 poly16x4_t __ret; \ 29354 poly16x4_t __s0 = __p0; \ 29355 poly16x4_t __s1 = __p1; \ 29356 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29357 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29358 __ret = (poly16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, 
(int8x8_t)__rev1, __p2, 5); \ 29359 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29360 __ret; \ 29361 }) 29362 #endif 29363 29364 #ifdef __LITTLE_ENDIAN__ 29365 #define vsriq_n_p8(__p0, __p1, __p2) __extension__ ({ \ 29366 poly8x16_t __ret; \ 29367 poly8x16_t __s0 = __p0; \ 29368 poly8x16_t __s1 = __p1; \ 29369 __ret = (poly8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \ 29370 __ret; \ 29371 }) 29372 #else 29373 #define vsriq_n_p8(__p0, __p1, __p2) __extension__ ({ \ 29374 poly8x16_t __ret; \ 29375 poly8x16_t __s0 = __p0; \ 29376 poly8x16_t __s1 = __p1; \ 29377 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29378 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29379 __ret = (poly8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \ 29380 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29381 __ret; \ 29382 }) 29383 #endif 29384 29385 #ifdef __LITTLE_ENDIAN__ 29386 #define vsriq_n_p16(__p0, __p1, __p2) __extension__ ({ \ 29387 poly16x8_t __ret; \ 29388 poly16x8_t __s0 = __p0; \ 29389 poly16x8_t __s1 = __p1; \ 29390 __ret = (poly16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 37); \ 29391 __ret; \ 29392 }) 29393 #else 29394 #define vsriq_n_p16(__p0, __p1, __p2) __extension__ ({ \ 29395 poly16x8_t __ret; \ 29396 poly16x8_t __s0 = __p0; \ 29397 poly16x8_t __s1 = __p1; \ 29398 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29399 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29400 __ret = (poly16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 37); \ 29401 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29402 __ret; \ 29403 }) 29404 
#endif 29405 29406 #ifdef __LITTLE_ENDIAN__ 29407 #define vsriq_n_u8(__p0, __p1, __p2) __extension__ ({ \ 29408 uint8x16_t __ret; \ 29409 uint8x16_t __s0 = __p0; \ 29410 uint8x16_t __s1 = __p1; \ 29411 __ret = (uint8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \ 29412 __ret; \ 29413 }) 29414 #else 29415 #define vsriq_n_u8(__p0, __p1, __p2) __extension__ ({ \ 29416 uint8x16_t __ret; \ 29417 uint8x16_t __s0 = __p0; \ 29418 uint8x16_t __s1 = __p1; \ 29419 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29420 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29421 __ret = (uint8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \ 29422 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29423 __ret; \ 29424 }) 29425 #endif 29426 29427 #ifdef __LITTLE_ENDIAN__ 29428 #define vsriq_n_u32(__p0, __p1, __p2) __extension__ ({ \ 29429 uint32x4_t __ret; \ 29430 uint32x4_t __s0 = __p0; \ 29431 uint32x4_t __s1 = __p1; \ 29432 __ret = (uint32x4_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 50); \ 29433 __ret; \ 29434 }) 29435 #else 29436 #define vsriq_n_u32(__p0, __p1, __p2) __extension__ ({ \ 29437 uint32x4_t __ret; \ 29438 uint32x4_t __s0 = __p0; \ 29439 uint32x4_t __s1 = __p1; \ 29440 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29441 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29442 __ret = (uint32x4_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 50); \ 29443 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29444 __ret; \ 29445 }) 29446 #endif 29447 29448 #ifdef __LITTLE_ENDIAN__ 29449 #define vsriq_n_u64(__p0, __p1, __p2) __extension__ ({ \ 29450 uint64x2_t __ret; \ 29451 uint64x2_t __s0 = __p0; \ 
29452 uint64x2_t __s1 = __p1; \ 29453 __ret = (uint64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \ 29454 __ret; \ 29455 }) 29456 #else 29457 #define vsriq_n_u64(__p0, __p1, __p2) __extension__ ({ \ 29458 uint64x2_t __ret; \ 29459 uint64x2_t __s0 = __p0; \ 29460 uint64x2_t __s1 = __p1; \ 29461 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 29462 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29463 __ret = (uint64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \ 29464 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 29465 __ret; \ 29466 }) 29467 #endif 29468 29469 #ifdef __LITTLE_ENDIAN__ 29470 #define vsriq_n_u16(__p0, __p1, __p2) __extension__ ({ \ 29471 uint16x8_t __ret; \ 29472 uint16x8_t __s0 = __p0; \ 29473 uint16x8_t __s1 = __p1; \ 29474 __ret = (uint16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \ 29475 __ret; \ 29476 }) 29477 #else 29478 #define vsriq_n_u16(__p0, __p1, __p2) __extension__ ({ \ 29479 uint16x8_t __ret; \ 29480 uint16x8_t __s0 = __p0; \ 29481 uint16x8_t __s1 = __p1; \ 29482 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29483 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29484 __ret = (uint16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \ 29485 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29486 __ret; \ 29487 }) 29488 #endif 29489 29490 #ifdef __LITTLE_ENDIAN__ 29491 #define vsriq_n_s8(__p0, __p1, __p2) __extension__ ({ \ 29492 int8x16_t __ret; \ 29493 int8x16_t __s0 = __p0; \ 29494 int8x16_t __s1 = __p1; \ 29495 __ret = (int8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \ 29496 __ret; \ 29497 }) 29498 #else 29499 #define vsriq_n_s8(__p0, __p1, __p2) __extension__ ({ \ 29500 int8x16_t __ret; \ 29501 int8x16_t __s0 = 
__p0; \ 29502 int8x16_t __s1 = __p1; \ 29503 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29504 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29505 __ret = (int8x16_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \ 29506 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29507 __ret; \ 29508 }) 29509 #endif 29510 29511 #ifdef __LITTLE_ENDIAN__ 29512 #define vsriq_n_s32(__p0, __p1, __p2) __extension__ ({ \ 29513 int32x4_t __ret; \ 29514 int32x4_t __s0 = __p0; \ 29515 int32x4_t __s1 = __p1; \ 29516 __ret = (int32x4_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \ 29517 __ret; \ 29518 }) 29519 #else 29520 #define vsriq_n_s32(__p0, __p1, __p2) __extension__ ({ \ 29521 int32x4_t __ret; \ 29522 int32x4_t __s0 = __p0; \ 29523 int32x4_t __s1 = __p1; \ 29524 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29525 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29526 __ret = (int32x4_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \ 29527 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29528 __ret; \ 29529 }) 29530 #endif 29531 29532 #ifdef __LITTLE_ENDIAN__ 29533 #define vsriq_n_s64(__p0, __p1, __p2) __extension__ ({ \ 29534 int64x2_t __ret; \ 29535 int64x2_t __s0 = __p0; \ 29536 int64x2_t __s1 = __p1; \ 29537 __ret = (int64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 35); \ 29538 __ret; \ 29539 }) 29540 #else 29541 #define vsriq_n_s64(__p0, __p1, __p2) __extension__ ({ \ 29542 int64x2_t __ret; \ 29543 int64x2_t __s0 = __p0; \ 29544 int64x2_t __s1 = __p1; \ 29545 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 29546 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, 
__s1, 1, 0); \ 29547 __ret = (int64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 35); \ 29548 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 29549 __ret; \ 29550 }) 29551 #endif 29552 29553 #ifdef __LITTLE_ENDIAN__ 29554 #define vsriq_n_s16(__p0, __p1, __p2) __extension__ ({ \ 29555 int16x8_t __ret; \ 29556 int16x8_t __s0 = __p0; \ 29557 int16x8_t __s1 = __p1; \ 29558 __ret = (int16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \ 29559 __ret; \ 29560 }) 29561 #else 29562 #define vsriq_n_s16(__p0, __p1, __p2) __extension__ ({ \ 29563 int16x8_t __ret; \ 29564 int16x8_t __s0 = __p0; \ 29565 int16x8_t __s1 = __p1; \ 29566 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29567 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29568 __ret = (int16x8_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 29569 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29570 __ret; \ 29571 }) 29572 #endif 29573 29574 #ifdef __LITTLE_ENDIAN__ 29575 #define vsri_n_u8(__p0, __p1, __p2) __extension__ ({ \ 29576 uint8x8_t __ret; \ 29577 uint8x8_t __s0 = __p0; \ 29578 uint8x8_t __s1 = __p1; \ 29579 __ret = (uint8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 16); \ 29580 __ret; \ 29581 }) 29582 #else 29583 #define vsri_n_u8(__p0, __p1, __p2) __extension__ ({ \ 29584 uint8x8_t __ret; \ 29585 uint8x8_t __s0 = __p0; \ 29586 uint8x8_t __s1 = __p1; \ 29587 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29588 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29589 __ret = (uint8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 16); \ 29590 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29591 __ret; \ 29592 }) 29593 #endif 29594 29595 #ifdef 
__LITTLE_ENDIAN__ 29596 #define vsri_n_u32(__p0, __p1, __p2) __extension__ ({ \ 29597 uint32x2_t __ret; \ 29598 uint32x2_t __s0 = __p0; \ 29599 uint32x2_t __s1 = __p1; \ 29600 __ret = (uint32x2_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 18); \ 29601 __ret; \ 29602 }) 29603 #else 29604 #define vsri_n_u32(__p0, __p1, __p2) __extension__ ({ \ 29605 uint32x2_t __ret; \ 29606 uint32x2_t __s0 = __p0; \ 29607 uint32x2_t __s1 = __p1; \ 29608 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 29609 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29610 __ret = (uint32x2_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 18); \ 29611 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 29612 __ret; \ 29613 }) 29614 #endif 29615 29616 #define vsri_n_u64(__p0, __p1, __p2) __extension__ ({ \ 29617 uint64x1_t __ret; \ 29618 uint64x1_t __s0 = __p0; \ 29619 uint64x1_t __s1 = __p1; \ 29620 __ret = (uint64x1_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 19); \ 29621 __ret; \ 29622 }) 29623 #ifdef __LITTLE_ENDIAN__ 29624 #define vsri_n_u16(__p0, __p1, __p2) __extension__ ({ \ 29625 uint16x4_t __ret; \ 29626 uint16x4_t __s0 = __p0; \ 29627 uint16x4_t __s1 = __p1; \ 29628 __ret = (uint16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 17); \ 29629 __ret; \ 29630 }) 29631 #else 29632 #define vsri_n_u16(__p0, __p1, __p2) __extension__ ({ \ 29633 uint16x4_t __ret; \ 29634 uint16x4_t __s0 = __p0; \ 29635 uint16x4_t __s1 = __p1; \ 29636 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29637 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29638 __ret = (uint16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 17); \ 29639 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29640 __ret; \ 29641 }) 29642 #endif 29643 29644 #ifdef __LITTLE_ENDIAN__ 29645 #define vsri_n_s8(__p0, 
__p1, __p2) __extension__ ({ \ 29646 int8x8_t __ret; \ 29647 int8x8_t __s0 = __p0; \ 29648 int8x8_t __s1 = __p1; \ 29649 __ret = (int8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 0); \ 29650 __ret; \ 29651 }) 29652 #else 29653 #define vsri_n_s8(__p0, __p1, __p2) __extension__ ({ \ 29654 int8x8_t __ret; \ 29655 int8x8_t __s0 = __p0; \ 29656 int8x8_t __s1 = __p1; \ 29657 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 29658 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29659 __ret = (int8x8_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 0); \ 29660 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 29661 __ret; \ 29662 }) 29663 #endif 29664 29665 #ifdef __LITTLE_ENDIAN__ 29666 #define vsri_n_s32(__p0, __p1, __p2) __extension__ ({ \ 29667 int32x2_t __ret; \ 29668 int32x2_t __s0 = __p0; \ 29669 int32x2_t __s1 = __p1; \ 29670 __ret = (int32x2_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \ 29671 __ret; \ 29672 }) 29673 #else 29674 #define vsri_n_s32(__p0, __p1, __p2) __extension__ ({ \ 29675 int32x2_t __ret; \ 29676 int32x2_t __s0 = __p0; \ 29677 int32x2_t __s1 = __p1; \ 29678 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 29679 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29680 __ret = (int32x2_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 29681 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 29682 __ret; \ 29683 }) 29684 #endif 29685 29686 #define vsri_n_s64(__p0, __p1, __p2) __extension__ ({ \ 29687 int64x1_t __ret; \ 29688 int64x1_t __s0 = __p0; \ 29689 int64x1_t __s1 = __p1; \ 29690 __ret = (int64x1_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 3); \ 29691 __ret; \ 29692 }) 29693 #ifdef __LITTLE_ENDIAN__ 29694 #define vsri_n_s16(__p0, __p1, __p2) __extension__ ({ \ 29695 int16x4_t __ret; \ 
29696 int16x4_t __s0 = __p0; \ 29697 int16x4_t __s1 = __p1; \ 29698 __ret = (int16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \ 29699 __ret; \ 29700 }) 29701 #else 29702 #define vsri_n_s16(__p0, __p1, __p2) __extension__ ({ \ 29703 int16x4_t __ret; \ 29704 int16x4_t __s0 = __p0; \ 29705 int16x4_t __s1 = __p1; \ 29706 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 29707 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29708 __ret = (int16x4_t) __builtin_neon_vsri_n_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 29709 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 29710 __ret; \ 29711 }) 29712 #endif 29713 29714 #ifdef __LITTLE_ENDIAN__ 29715 #define vst1_p8(__p0, __p1) __extension__ ({ \ 29716 poly8x8_t __s1 = __p1; \ 29717 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 4); \ 29718 }) 29719 #else 29720 #define vst1_p8(__p0, __p1) __extension__ ({ \ 29721 poly8x8_t __s1 = __p1; \ 29722 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29723 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 4); \ 29724 }) 29725 #endif 29726 29727 #ifdef __LITTLE_ENDIAN__ 29728 #define vst1_p16(__p0, __p1) __extension__ ({ \ 29729 poly16x4_t __s1 = __p1; \ 29730 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 5); \ 29731 }) 29732 #else 29733 #define vst1_p16(__p0, __p1) __extension__ ({ \ 29734 poly16x4_t __s1 = __p1; \ 29735 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29736 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 5); \ 29737 }) 29738 #endif 29739 29740 #ifdef __LITTLE_ENDIAN__ 29741 #define vst1q_p8(__p0, __p1) __extension__ ({ \ 29742 poly8x16_t __s1 = __p1; \ 29743 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 36); \ 29744 }) 29745 #else 29746 #define vst1q_p8(__p0, __p1) __extension__ ({ \ 29747 poly8x16_t __s1 = __p1; \ 29748 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 
10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29749 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 36); \ 29750 }) 29751 #endif 29752 29753 #ifdef __LITTLE_ENDIAN__ 29754 #define vst1q_p16(__p0, __p1) __extension__ ({ \ 29755 poly16x8_t __s1 = __p1; \ 29756 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 37); \ 29757 }) 29758 #else 29759 #define vst1q_p16(__p0, __p1) __extension__ ({ \ 29760 poly16x8_t __s1 = __p1; \ 29761 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29762 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 37); \ 29763 }) 29764 #endif 29765 29766 #ifdef __LITTLE_ENDIAN__ 29767 #define vst1q_u8(__p0, __p1) __extension__ ({ \ 29768 uint8x16_t __s1 = __p1; \ 29769 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 48); \ 29770 }) 29771 #else 29772 #define vst1q_u8(__p0, __p1) __extension__ ({ \ 29773 uint8x16_t __s1 = __p1; \ 29774 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29775 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 48); \ 29776 }) 29777 #endif 29778 29779 #ifdef __LITTLE_ENDIAN__ 29780 #define vst1q_u32(__p0, __p1) __extension__ ({ \ 29781 uint32x4_t __s1 = __p1; \ 29782 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 50); \ 29783 }) 29784 #else 29785 #define vst1q_u32(__p0, __p1) __extension__ ({ \ 29786 uint32x4_t __s1 = __p1; \ 29787 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29788 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 50); \ 29789 }) 29790 #endif 29791 29792 #ifdef __LITTLE_ENDIAN__ 29793 #define vst1q_u64(__p0, __p1) __extension__ ({ \ 29794 uint64x2_t __s1 = __p1; \ 29795 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 51); \ 29796 }) 29797 #else 29798 #define vst1q_u64(__p0, __p1) __extension__ ({ \ 29799 uint64x2_t __s1 = __p1; \ 29800 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29801 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 51); \ 29802 }) 29803 
#endif 29804 29805 #ifdef __LITTLE_ENDIAN__ 29806 #define vst1q_u16(__p0, __p1) __extension__ ({ \ 29807 uint16x8_t __s1 = __p1; \ 29808 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 49); \ 29809 }) 29810 #else 29811 #define vst1q_u16(__p0, __p1) __extension__ ({ \ 29812 uint16x8_t __s1 = __p1; \ 29813 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29814 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 49); \ 29815 }) 29816 #endif 29817 29818 #ifdef __LITTLE_ENDIAN__ 29819 #define vst1q_s8(__p0, __p1) __extension__ ({ \ 29820 int8x16_t __s1 = __p1; \ 29821 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 32); \ 29822 }) 29823 #else 29824 #define vst1q_s8(__p0, __p1) __extension__ ({ \ 29825 int8x16_t __s1 = __p1; \ 29826 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 29827 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 32); \ 29828 }) 29829 #endif 29830 29831 #ifdef __LITTLE_ENDIAN__ 29832 #define vst1q_f32(__p0, __p1) __extension__ ({ \ 29833 float32x4_t __s1 = __p1; \ 29834 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 41); \ 29835 }) 29836 #else 29837 #define vst1q_f32(__p0, __p1) __extension__ ({ \ 29838 float32x4_t __s1 = __p1; \ 29839 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29840 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 41); \ 29841 }) 29842 #endif 29843 29844 #ifdef __LITTLE_ENDIAN__ 29845 #define vst1q_s32(__p0, __p1) __extension__ ({ \ 29846 int32x4_t __s1 = __p1; \ 29847 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 34); \ 29848 }) 29849 #else 29850 #define vst1q_s32(__p0, __p1) __extension__ ({ \ 29851 int32x4_t __s1 = __p1; \ 29852 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29853 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 34); \ 29854 }) 29855 #endif 29856 29857 #ifdef __LITTLE_ENDIAN__ 29858 #define vst1q_s64(__p0, __p1) __extension__ ({ \ 29859 int64x2_t 
__s1 = __p1; \ 29860 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 35); \ 29861 }) 29862 #else 29863 #define vst1q_s64(__p0, __p1) __extension__ ({ \ 29864 int64x2_t __s1 = __p1; \ 29865 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29866 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 35); \ 29867 }) 29868 #endif 29869 29870 #ifdef __LITTLE_ENDIAN__ 29871 #define vst1q_s16(__p0, __p1) __extension__ ({ \ 29872 int16x8_t __s1 = __p1; \ 29873 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 33); \ 29874 }) 29875 #else 29876 #define vst1q_s16(__p0, __p1) __extension__ ({ \ 29877 int16x8_t __s1 = __p1; \ 29878 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29879 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 33); \ 29880 }) 29881 #endif 29882 29883 #ifdef __LITTLE_ENDIAN__ 29884 #define vst1_u8(__p0, __p1) __extension__ ({ \ 29885 uint8x8_t __s1 = __p1; \ 29886 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 16); \ 29887 }) 29888 #else 29889 #define vst1_u8(__p0, __p1) __extension__ ({ \ 29890 uint8x8_t __s1 = __p1; \ 29891 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29892 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 16); \ 29893 }) 29894 #endif 29895 29896 #ifdef __LITTLE_ENDIAN__ 29897 #define vst1_u32(__p0, __p1) __extension__ ({ \ 29898 uint32x2_t __s1 = __p1; \ 29899 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 18); \ 29900 }) 29901 #else 29902 #define vst1_u32(__p0, __p1) __extension__ ({ \ 29903 uint32x2_t __s1 = __p1; \ 29904 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29905 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 18); \ 29906 }) 29907 #endif 29908 29909 #define vst1_u64(__p0, __p1) __extension__ ({ \ 29910 uint64x1_t __s1 = __p1; \ 29911 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 19); \ 29912 }) 29913 #ifdef __LITTLE_ENDIAN__ 29914 #define vst1_u16(__p0, __p1) __extension__ ({ \ 29915 uint16x4_t __s1 = __p1; \ 29916 
__builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 17); \ 29917 }) 29918 #else 29919 #define vst1_u16(__p0, __p1) __extension__ ({ \ 29920 uint16x4_t __s1 = __p1; \ 29921 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29922 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 17); \ 29923 }) 29924 #endif 29925 29926 #ifdef __LITTLE_ENDIAN__ 29927 #define vst1_s8(__p0, __p1) __extension__ ({ \ 29928 int8x8_t __s1 = __p1; \ 29929 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 0); \ 29930 }) 29931 #else 29932 #define vst1_s8(__p0, __p1) __extension__ ({ \ 29933 int8x8_t __s1 = __p1; \ 29934 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29935 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 0); \ 29936 }) 29937 #endif 29938 29939 #ifdef __LITTLE_ENDIAN__ 29940 #define vst1_f32(__p0, __p1) __extension__ ({ \ 29941 float32x2_t __s1 = __p1; \ 29942 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 9); \ 29943 }) 29944 #else 29945 #define vst1_f32(__p0, __p1) __extension__ ({ \ 29946 float32x2_t __s1 = __p1; \ 29947 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29948 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 9); \ 29949 }) 29950 #endif 29951 29952 #ifdef __LITTLE_ENDIAN__ 29953 #define vst1_s32(__p0, __p1) __extension__ ({ \ 29954 int32x2_t __s1 = __p1; \ 29955 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 2); \ 29956 }) 29957 #else 29958 #define vst1_s32(__p0, __p1) __extension__ ({ \ 29959 int32x2_t __s1 = __p1; \ 29960 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 29961 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 2); \ 29962 }) 29963 #endif 29964 29965 #define vst1_s64(__p0, __p1) __extension__ ({ \ 29966 int64x1_t __s1 = __p1; \ 29967 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 3); \ 29968 }) 29969 #ifdef __LITTLE_ENDIAN__ 29970 #define vst1_s16(__p0, __p1) __extension__ ({ \ 29971 int16x4_t __s1 = __p1; \ 29972 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 1); \ 
29973 }) 29974 #else 29975 #define vst1_s16(__p0, __p1) __extension__ ({ \ 29976 int16x4_t __s1 = __p1; \ 29977 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 29978 __builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 1); \ 29979 }) 29980 #endif 29981 29982 #ifdef __LITTLE_ENDIAN__ 29983 #define vst1_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 29984 poly8x8_t __s1 = __p1; \ 29985 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 4); \ 29986 }) 29987 #else 29988 #define vst1_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 29989 poly8x8_t __s1 = __p1; \ 29990 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 29991 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 4); \ 29992 }) 29993 #endif 29994 29995 #ifdef __LITTLE_ENDIAN__ 29996 #define vst1_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 29997 poly16x4_t __s1 = __p1; \ 29998 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 5); \ 29999 }) 30000 #else 30001 #define vst1_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 30002 poly16x4_t __s1 = __p1; \ 30003 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 30004 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 5); \ 30005 }) 30006 #endif 30007 30008 #ifdef __LITTLE_ENDIAN__ 30009 #define vst1q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 30010 poly8x16_t __s1 = __p1; \ 30011 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 36); \ 30012 }) 30013 #else 30014 #define vst1q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 30015 poly8x16_t __s1 = __p1; \ 30016 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30017 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 36); \ 30018 }) 30019 #endif 30020 30021 #ifdef __LITTLE_ENDIAN__ 30022 #define vst1q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 30023 poly16x8_t __s1 = __p1; \ 30024 __builtin_neon_vst1q_lane_v(__p0, 
(int8x16_t)__s1, __p2, 37); \ 30025 }) 30026 #else 30027 #define vst1q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 30028 poly16x8_t __s1 = __p1; \ 30029 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 30030 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 37); \ 30031 }) 30032 #endif 30033 30034 #ifdef __LITTLE_ENDIAN__ 30035 #define vst1q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 30036 uint8x16_t __s1 = __p1; \ 30037 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 48); \ 30038 }) 30039 #else 30040 #define vst1q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 30041 uint8x16_t __s1 = __p1; \ 30042 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30043 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 48); \ 30044 }) 30045 #endif 30046 30047 #ifdef __LITTLE_ENDIAN__ 30048 #define vst1q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 30049 uint32x4_t __s1 = __p1; \ 30050 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 50); \ 30051 }) 30052 #else 30053 #define vst1q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 30054 uint32x4_t __s1 = __p1; \ 30055 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 30056 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 50); \ 30057 }) 30058 #endif 30059 30060 #ifdef __LITTLE_ENDIAN__ 30061 #define vst1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 30062 uint64x2_t __s1 = __p1; \ 30063 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 51); \ 30064 }) 30065 #else 30066 #define vst1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 30067 uint64x2_t __s1 = __p1; \ 30068 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 30069 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 51); \ 30070 }) 30071 #endif 30072 30073 #ifdef __LITTLE_ENDIAN__ 30074 #define vst1q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 30075 
uint16x8_t __s1 = __p1; \ 30076 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 49); \ 30077 }) 30078 #else 30079 #define vst1q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 30080 uint16x8_t __s1 = __p1; \ 30081 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 30082 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 49); \ 30083 }) 30084 #endif 30085 30086 #ifdef __LITTLE_ENDIAN__ 30087 #define vst1q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 30088 int8x16_t __s1 = __p1; \ 30089 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 32); \ 30090 }) 30091 #else 30092 #define vst1q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 30093 int8x16_t __s1 = __p1; \ 30094 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30095 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 32); \ 30096 }) 30097 #endif 30098 30099 #ifdef __LITTLE_ENDIAN__ 30100 #define vst1q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 30101 float32x4_t __s1 = __p1; \ 30102 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 41); \ 30103 }) 30104 #else 30105 #define vst1q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 30106 float32x4_t __s1 = __p1; \ 30107 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 30108 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 41); \ 30109 }) 30110 #endif 30111 30112 #ifdef __LITTLE_ENDIAN__ 30113 #define vst1q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 30114 int32x4_t __s1 = __p1; \ 30115 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 34); \ 30116 }) 30117 #else 30118 #define vst1q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 30119 int32x4_t __s1 = __p1; \ 30120 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 30121 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 34); \ 30122 }) 30123 #endif 30124 30125 #ifdef __LITTLE_ENDIAN__ 30126 
#define vst1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 30127 int64x2_t __s1 = __p1; \ 30128 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 35); \ 30129 }) 30130 #else 30131 #define vst1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 30132 int64x2_t __s1 = __p1; \ 30133 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 30134 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 35); \ 30135 }) 30136 #endif 30137 30138 #ifdef __LITTLE_ENDIAN__ 30139 #define vst1q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 30140 int16x8_t __s1 = __p1; \ 30141 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 33); \ 30142 }) 30143 #else 30144 #define vst1q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 30145 int16x8_t __s1 = __p1; \ 30146 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 30147 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 33); \ 30148 }) 30149 #endif 30150 30151 #ifdef __LITTLE_ENDIAN__ 30152 #define vst1_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 30153 uint8x8_t __s1 = __p1; \ 30154 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 16); \ 30155 }) 30156 #else 30157 #define vst1_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 30158 uint8x8_t __s1 = __p1; \ 30159 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 30160 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 16); \ 30161 }) 30162 #endif 30163 30164 #ifdef __LITTLE_ENDIAN__ 30165 #define vst1_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 30166 uint32x2_t __s1 = __p1; \ 30167 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 18); \ 30168 }) 30169 #else 30170 #define vst1_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 30171 uint32x2_t __s1 = __p1; \ 30172 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 30173 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 18); \ 30174 }) 30175 #endif 30176 30177 #define vst1_lane_u64(__p0, 
__p1, __p2) __extension__ ({ \ 30178 uint64x1_t __s1 = __p1; \ 30179 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 19); \ 30180 }) 30181 #ifdef __LITTLE_ENDIAN__ 30182 #define vst1_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 30183 uint16x4_t __s1 = __p1; \ 30184 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 17); \ 30185 }) 30186 #else 30187 #define vst1_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 30188 uint16x4_t __s1 = __p1; \ 30189 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 30190 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 17); \ 30191 }) 30192 #endif 30193 30194 #ifdef __LITTLE_ENDIAN__ 30195 #define vst1_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 30196 int8x8_t __s1 = __p1; \ 30197 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 0); \ 30198 }) 30199 #else 30200 #define vst1_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 30201 int8x8_t __s1 = __p1; \ 30202 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 30203 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 0); \ 30204 }) 30205 #endif 30206 30207 #ifdef __LITTLE_ENDIAN__ 30208 #define vst1_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 30209 float32x2_t __s1 = __p1; \ 30210 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 9); \ 30211 }) 30212 #else 30213 #define vst1_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 30214 float32x2_t __s1 = __p1; \ 30215 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 30216 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 9); \ 30217 }) 30218 #endif 30219 30220 #ifdef __LITTLE_ENDIAN__ 30221 #define vst1_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 30222 int32x2_t __s1 = __p1; \ 30223 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 2); \ 30224 }) 30225 #else 30226 #define vst1_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 30227 int32x2_t __s1 = __p1; \ 30228 int32x2_t __rev1; __rev1 = 
__builtin_shufflevector(__s1, __s1, 1, 0); \ 30229 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 2); \ 30230 }) 30231 #endif 30232 30233 #define vst1_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 30234 int64x1_t __s1 = __p1; \ 30235 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 3); \ 30236 }) 30237 #ifdef __LITTLE_ENDIAN__ 30238 #define vst1_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 30239 int16x4_t __s1 = __p1; \ 30240 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 1); \ 30241 }) 30242 #else 30243 #define vst1_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 30244 int16x4_t __s1 = __p1; \ 30245 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 30246 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 1); \ 30247 }) 30248 #endif 30249 30250 #ifdef __LITTLE_ENDIAN__ 30251 #define vst1_p8_x2(__p0, __p1) __extension__ ({ \ 30252 poly8x8x2_t __s1 = __p1; \ 30253 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 4); \ 30254 }) 30255 #else 30256 #define vst1_p8_x2(__p0, __p1) __extension__ ({ \ 30257 poly8x8x2_t __s1 = __p1; \ 30258 poly8x8x2_t __rev1; \ 30259 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30260 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30261 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 4); \ 30262 }) 30263 #endif 30264 30265 #ifdef __LITTLE_ENDIAN__ 30266 #define vst1_p16_x2(__p0, __p1) __extension__ ({ \ 30267 poly16x4x2_t __s1 = __p1; \ 30268 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 5); \ 30269 }) 30270 #else 30271 #define vst1_p16_x2(__p0, __p1) __extension__ ({ \ 30272 poly16x4x2_t __s1 = __p1; \ 30273 poly16x4x2_t __rev1; \ 30274 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30275 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 
30276 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 5); \ 30277 }) 30278 #endif 30279 30280 #ifdef __LITTLE_ENDIAN__ 30281 #define vst1q_p8_x2(__p0, __p1) __extension__ ({ \ 30282 poly8x16x2_t __s1 = __p1; \ 30283 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 36); \ 30284 }) 30285 #else 30286 #define vst1q_p8_x2(__p0, __p1) __extension__ ({ \ 30287 poly8x16x2_t __s1 = __p1; \ 30288 poly8x16x2_t __rev1; \ 30289 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30290 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30291 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 36); \ 30292 }) 30293 #endif 30294 30295 #ifdef __LITTLE_ENDIAN__ 30296 #define vst1q_p16_x2(__p0, __p1) __extension__ ({ \ 30297 poly16x8x2_t __s1 = __p1; \ 30298 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 37); \ 30299 }) 30300 #else 30301 #define vst1q_p16_x2(__p0, __p1) __extension__ ({ \ 30302 poly16x8x2_t __s1 = __p1; \ 30303 poly16x8x2_t __rev1; \ 30304 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30305 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30306 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 37); \ 30307 }) 30308 #endif 30309 30310 #ifdef __LITTLE_ENDIAN__ 30311 #define vst1q_u8_x2(__p0, __p1) __extension__ ({ \ 30312 uint8x16x2_t __s1 = __p1; \ 30313 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 48); \ 30314 }) 30315 #else 30316 #define vst1q_u8_x2(__p0, __p1) __extension__ ({ \ 30317 uint8x16x2_t __s1 = __p1; \ 30318 uint8x16x2_t __rev1; \ 30319 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 
7, 6, 5, 4, 3, 2, 1, 0); \ 30320 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30321 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 48); \ 30322 }) 30323 #endif 30324 30325 #ifdef __LITTLE_ENDIAN__ 30326 #define vst1q_u32_x2(__p0, __p1) __extension__ ({ \ 30327 uint32x4x2_t __s1 = __p1; \ 30328 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 50); \ 30329 }) 30330 #else 30331 #define vst1q_u32_x2(__p0, __p1) __extension__ ({ \ 30332 uint32x4x2_t __s1 = __p1; \ 30333 uint32x4x2_t __rev1; \ 30334 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30335 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30336 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 50); \ 30337 }) 30338 #endif 30339 30340 #ifdef __LITTLE_ENDIAN__ 30341 #define vst1q_u64_x2(__p0, __p1) __extension__ ({ \ 30342 uint64x2x2_t __s1 = __p1; \ 30343 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 51); \ 30344 }) 30345 #else 30346 #define vst1q_u64_x2(__p0, __p1) __extension__ ({ \ 30347 uint64x2x2_t __s1 = __p1; \ 30348 uint64x2x2_t __rev1; \ 30349 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30350 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30351 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 51); \ 30352 }) 30353 #endif 30354 30355 #ifdef __LITTLE_ENDIAN__ 30356 #define vst1q_u16_x2(__p0, __p1) __extension__ ({ \ 30357 uint16x8x2_t __s1 = __p1; \ 30358 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 49); \ 30359 }) 30360 #else 30361 #define vst1q_u16_x2(__p0, __p1) __extension__ ({ \ 30362 uint16x8x2_t __s1 = __p1; \ 30363 uint16x8x2_t __rev1; \ 30364 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], 
__s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30365 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30366 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 49); \ 30367 }) 30368 #endif 30369 30370 #ifdef __LITTLE_ENDIAN__ 30371 #define vst1q_s8_x2(__p0, __p1) __extension__ ({ \ 30372 int8x16x2_t __s1 = __p1; \ 30373 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 32); \ 30374 }) 30375 #else 30376 #define vst1q_s8_x2(__p0, __p1) __extension__ ({ \ 30377 int8x16x2_t __s1 = __p1; \ 30378 int8x16x2_t __rev1; \ 30379 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30380 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30381 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 32); \ 30382 }) 30383 #endif 30384 30385 #ifdef __LITTLE_ENDIAN__ 30386 #define vst1q_f32_x2(__p0, __p1) __extension__ ({ \ 30387 float32x4x2_t __s1 = __p1; \ 30388 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 41); \ 30389 }) 30390 #else 30391 #define vst1q_f32_x2(__p0, __p1) __extension__ ({ \ 30392 float32x4x2_t __s1 = __p1; \ 30393 float32x4x2_t __rev1; \ 30394 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30395 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30396 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 41); \ 30397 }) 30398 #endif 30399 30400 #ifdef __LITTLE_ENDIAN__ 30401 #define vst1q_s32_x2(__p0, __p1) __extension__ ({ \ 30402 int32x4x2_t __s1 = __p1; \ 30403 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 34); \ 30404 }) 30405 #else 30406 #define vst1q_s32_x2(__p0, __p1) __extension__ ({ \ 30407 int32x4x2_t __s1 = __p1; \ 30408 
int32x4x2_t __rev1; \ 30409 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30410 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30411 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 34); \ 30412 }) 30413 #endif 30414 30415 #ifdef __LITTLE_ENDIAN__ 30416 #define vst1q_s64_x2(__p0, __p1) __extension__ ({ \ 30417 int64x2x2_t __s1 = __p1; \ 30418 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 35); \ 30419 }) 30420 #else 30421 #define vst1q_s64_x2(__p0, __p1) __extension__ ({ \ 30422 int64x2x2_t __s1 = __p1; \ 30423 int64x2x2_t __rev1; \ 30424 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30425 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30426 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 35); \ 30427 }) 30428 #endif 30429 30430 #ifdef __LITTLE_ENDIAN__ 30431 #define vst1q_s16_x2(__p0, __p1) __extension__ ({ \ 30432 int16x8x2_t __s1 = __p1; \ 30433 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 33); \ 30434 }) 30435 #else 30436 #define vst1q_s16_x2(__p0, __p1) __extension__ ({ \ 30437 int16x8x2_t __s1 = __p1; \ 30438 int16x8x2_t __rev1; \ 30439 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30440 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30441 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 33); \ 30442 }) 30443 #endif 30444 30445 #ifdef __LITTLE_ENDIAN__ 30446 #define vst1_u8_x2(__p0, __p1) __extension__ ({ \ 30447 uint8x8x2_t __s1 = __p1; \ 30448 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 16); \ 30449 }) 30450 #else 30451 #define vst1_u8_x2(__p0, __p1) __extension__ ({ \ 30452 uint8x8x2_t __s1 = __p1; \ 30453 uint8x8x2_t __rev1; \ 30454 
__rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30455 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30456 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 16); \ 30457 }) 30458 #endif 30459 30460 #ifdef __LITTLE_ENDIAN__ 30461 #define vst1_u32_x2(__p0, __p1) __extension__ ({ \ 30462 uint32x2x2_t __s1 = __p1; \ 30463 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 18); \ 30464 }) 30465 #else 30466 #define vst1_u32_x2(__p0, __p1) __extension__ ({ \ 30467 uint32x2x2_t __s1 = __p1; \ 30468 uint32x2x2_t __rev1; \ 30469 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30470 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30471 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 18); \ 30472 }) 30473 #endif 30474 30475 #define vst1_u64_x2(__p0, __p1) __extension__ ({ \ 30476 uint64x1x2_t __s1 = __p1; \ 30477 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 19); \ 30478 }) 30479 #ifdef __LITTLE_ENDIAN__ 30480 #define vst1_u16_x2(__p0, __p1) __extension__ ({ \ 30481 uint16x4x2_t __s1 = __p1; \ 30482 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 17); \ 30483 }) 30484 #else 30485 #define vst1_u16_x2(__p0, __p1) __extension__ ({ \ 30486 uint16x4x2_t __s1 = __p1; \ 30487 uint16x4x2_t __rev1; \ 30488 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30489 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30490 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 17); \ 30491 }) 30492 #endif 30493 30494 #ifdef __LITTLE_ENDIAN__ 30495 #define vst1_s8_x2(__p0, __p1) __extension__ ({ \ 30496 int8x8x2_t __s1 = __p1; \ 30497 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 0); \ 
30498 }) 30499 #else 30500 #define vst1_s8_x2(__p0, __p1) __extension__ ({ \ 30501 int8x8x2_t __s1 = __p1; \ 30502 int8x8x2_t __rev1; \ 30503 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30504 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30505 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 0); \ 30506 }) 30507 #endif 30508 30509 #ifdef __LITTLE_ENDIAN__ 30510 #define vst1_f32_x2(__p0, __p1) __extension__ ({ \ 30511 float32x2x2_t __s1 = __p1; \ 30512 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 9); \ 30513 }) 30514 #else 30515 #define vst1_f32_x2(__p0, __p1) __extension__ ({ \ 30516 float32x2x2_t __s1 = __p1; \ 30517 float32x2x2_t __rev1; \ 30518 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30519 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30520 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 9); \ 30521 }) 30522 #endif 30523 30524 #ifdef __LITTLE_ENDIAN__ 30525 #define vst1_s32_x2(__p0, __p1) __extension__ ({ \ 30526 int32x2x2_t __s1 = __p1; \ 30527 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 2); \ 30528 }) 30529 #else 30530 #define vst1_s32_x2(__p0, __p1) __extension__ ({ \ 30531 int32x2x2_t __s1 = __p1; \ 30532 int32x2x2_t __rev1; \ 30533 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30534 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30535 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 2); \ 30536 }) 30537 #endif 30538 30539 #define vst1_s64_x2(__p0, __p1) __extension__ ({ \ 30540 int64x1x2_t __s1 = __p1; \ 30541 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 3); \ 30542 }) 30543 #ifdef __LITTLE_ENDIAN__ 30544 #define vst1_s16_x2(__p0, __p1) __extension__ ({ 
\ 30545 int16x4x2_t __s1 = __p1; \ 30546 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 1); \ 30547 }) 30548 #else 30549 #define vst1_s16_x2(__p0, __p1) __extension__ ({ \ 30550 int16x4x2_t __s1 = __p1; \ 30551 int16x4x2_t __rev1; \ 30552 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30553 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30554 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 1); \ 30555 }) 30556 #endif 30557 30558 #ifdef __LITTLE_ENDIAN__ 30559 #define vst1_p8_x3(__p0, __p1) __extension__ ({ \ 30560 poly8x8x3_t __s1 = __p1; \ 30561 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 4); \ 30562 }) 30563 #else 30564 #define vst1_p8_x3(__p0, __p1) __extension__ ({ \ 30565 poly8x8x3_t __s1 = __p1; \ 30566 poly8x8x3_t __rev1; \ 30567 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30568 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30569 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 30570 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 4); \ 30571 }) 30572 #endif 30573 30574 #ifdef __LITTLE_ENDIAN__ 30575 #define vst1_p16_x3(__p0, __p1) __extension__ ({ \ 30576 poly16x4x3_t __s1 = __p1; \ 30577 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 5); \ 30578 }) 30579 #else 30580 #define vst1_p16_x3(__p0, __p1) __extension__ ({ \ 30581 poly16x4x3_t __s1 = __p1; \ 30582 poly16x4x3_t __rev1; \ 30583 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30584 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30585 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 
1, 0); \ 30586 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 5); \ 30587 }) 30588 #endif 30589 30590 #ifdef __LITTLE_ENDIAN__ 30591 #define vst1q_p8_x3(__p0, __p1) __extension__ ({ \ 30592 poly8x16x3_t __s1 = __p1; \ 30593 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 36); \ 30594 }) 30595 #else 30596 #define vst1q_p8_x3(__p0, __p1) __extension__ ({ \ 30597 poly8x16x3_t __s1 = __p1; \ 30598 poly8x16x3_t __rev1; \ 30599 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30600 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30601 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30602 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 36); \ 30603 }) 30604 #endif 30605 30606 #ifdef __LITTLE_ENDIAN__ 30607 #define vst1q_p16_x3(__p0, __p1) __extension__ ({ \ 30608 poly16x8x3_t __s1 = __p1; \ 30609 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 37); \ 30610 }) 30611 #else 30612 #define vst1q_p16_x3(__p0, __p1) __extension__ ({ \ 30613 poly16x8x3_t __s1 = __p1; \ 30614 poly16x8x3_t __rev1; \ 30615 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30616 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30617 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 30618 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 37); \ 30619 }) 30620 #endif 30621 30622 #ifdef __LITTLE_ENDIAN__ 30623 #define vst1q_u8_x3(__p0, __p1) __extension__ ({ \ 30624 
uint8x16x3_t __s1 = __p1; \ 30625 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 48); \ 30626 }) 30627 #else 30628 #define vst1q_u8_x3(__p0, __p1) __extension__ ({ \ 30629 uint8x16x3_t __s1 = __p1; \ 30630 uint8x16x3_t __rev1; \ 30631 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30632 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30633 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30634 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 48); \ 30635 }) 30636 #endif 30637 30638 #ifdef __LITTLE_ENDIAN__ 30639 #define vst1q_u32_x3(__p0, __p1) __extension__ ({ \ 30640 uint32x4x3_t __s1 = __p1; \ 30641 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 50); \ 30642 }) 30643 #else 30644 #define vst1q_u32_x3(__p0, __p1) __extension__ ({ \ 30645 uint32x4x3_t __s1 = __p1; \ 30646 uint32x4x3_t __rev1; \ 30647 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30648 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30649 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 30650 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 50); \ 30651 }) 30652 #endif 30653 30654 #ifdef __LITTLE_ENDIAN__ 30655 #define vst1q_u64_x3(__p0, __p1) __extension__ ({ \ 30656 uint64x2x3_t __s1 = __p1; \ 30657 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 51); \ 30658 }) 30659 #else 30660 #define vst1q_u64_x3(__p0, __p1) __extension__ ({ \ 30661 uint64x2x3_t __s1 = __p1; \ 30662 uint64x2x3_t __rev1; \ 
30663 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30664 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30665 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 30666 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 51); \ 30667 }) 30668 #endif 30669 30670 #ifdef __LITTLE_ENDIAN__ 30671 #define vst1q_u16_x3(__p0, __p1) __extension__ ({ \ 30672 uint16x8x3_t __s1 = __p1; \ 30673 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 49); \ 30674 }) 30675 #else 30676 #define vst1q_u16_x3(__p0, __p1) __extension__ ({ \ 30677 uint16x8x3_t __s1 = __p1; \ 30678 uint16x8x3_t __rev1; \ 30679 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30680 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30681 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 30682 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 49); \ 30683 }) 30684 #endif 30685 30686 #ifdef __LITTLE_ENDIAN__ 30687 #define vst1q_s8_x3(__p0, __p1) __extension__ ({ \ 30688 int8x16x3_t __s1 = __p1; \ 30689 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 32); \ 30690 }) 30691 #else 30692 #define vst1q_s8_x3(__p0, __p1) __extension__ ({ \ 30693 int8x16x3_t __s1 = __p1; \ 30694 int8x16x3_t __rev1; \ 30695 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30696 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30697 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30698 
__builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 32); \ 30699 }) 30700 #endif 30701 30702 #ifdef __LITTLE_ENDIAN__ 30703 #define vst1q_f32_x3(__p0, __p1) __extension__ ({ \ 30704 float32x4x3_t __s1 = __p1; \ 30705 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 41); \ 30706 }) 30707 #else 30708 #define vst1q_f32_x3(__p0, __p1) __extension__ ({ \ 30709 float32x4x3_t __s1 = __p1; \ 30710 float32x4x3_t __rev1; \ 30711 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30712 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30713 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 30714 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 41); \ 30715 }) 30716 #endif 30717 30718 #ifdef __LITTLE_ENDIAN__ 30719 #define vst1q_s32_x3(__p0, __p1) __extension__ ({ \ 30720 int32x4x3_t __s1 = __p1; \ 30721 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 34); \ 30722 }) 30723 #else 30724 #define vst1q_s32_x3(__p0, __p1) __extension__ ({ \ 30725 int32x4x3_t __s1 = __p1; \ 30726 int32x4x3_t __rev1; \ 30727 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30728 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30729 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 30730 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 34); \ 30731 }) 30732 #endif 30733 30734 #ifdef __LITTLE_ENDIAN__ 30735 #define vst1q_s64_x3(__p0, __p1) __extension__ ({ \ 30736 int64x2x3_t __s1 = __p1; \ 30737 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 35); \ 30738 }) 30739 #else 30740 
#define vst1q_s64_x3(__p0, __p1) __extension__ ({ \ 30741 int64x2x3_t __s1 = __p1; \ 30742 int64x2x3_t __rev1; \ 30743 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30744 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30745 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 30746 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 35); \ 30747 }) 30748 #endif 30749 30750 #ifdef __LITTLE_ENDIAN__ 30751 #define vst1q_s16_x3(__p0, __p1) __extension__ ({ \ 30752 int16x8x3_t __s1 = __p1; \ 30753 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 33); \ 30754 }) 30755 #else 30756 #define vst1q_s16_x3(__p0, __p1) __extension__ ({ \ 30757 int16x8x3_t __s1 = __p1; \ 30758 int16x8x3_t __rev1; \ 30759 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30760 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30761 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 30762 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 33); \ 30763 }) 30764 #endif 30765 30766 #ifdef __LITTLE_ENDIAN__ 30767 #define vst1_u8_x3(__p0, __p1) __extension__ ({ \ 30768 uint8x8x3_t __s1 = __p1; \ 30769 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 16); \ 30770 }) 30771 #else 30772 #define vst1_u8_x3(__p0, __p1) __extension__ ({ \ 30773 uint8x8x3_t __s1 = __p1; \ 30774 uint8x8x3_t __rev1; \ 30775 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30776 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30777 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 
\ 30778 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 16); \ 30779 }) 30780 #endif 30781 30782 #ifdef __LITTLE_ENDIAN__ 30783 #define vst1_u32_x3(__p0, __p1) __extension__ ({ \ 30784 uint32x2x3_t __s1 = __p1; \ 30785 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 18); \ 30786 }) 30787 #else 30788 #define vst1_u32_x3(__p0, __p1) __extension__ ({ \ 30789 uint32x2x3_t __s1 = __p1; \ 30790 uint32x2x3_t __rev1; \ 30791 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30792 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30793 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 30794 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 18); \ 30795 }) 30796 #endif 30797 30798 #define vst1_u64_x3(__p0, __p1) __extension__ ({ \ 30799 uint64x1x3_t __s1 = __p1; \ 30800 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 19); \ 30801 }) 30802 #ifdef __LITTLE_ENDIAN__ 30803 #define vst1_u16_x3(__p0, __p1) __extension__ ({ \ 30804 uint16x4x3_t __s1 = __p1; \ 30805 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 17); \ 30806 }) 30807 #else 30808 #define vst1_u16_x3(__p0, __p1) __extension__ ({ \ 30809 uint16x4x3_t __s1 = __p1; \ 30810 uint16x4x3_t __rev1; \ 30811 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30812 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30813 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 30814 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 17); \ 30815 }) 30816 #endif 30817 30818 #ifdef __LITTLE_ENDIAN__ 30819 #define vst1_s8_x3(__p0, __p1) __extension__ ({ \ 
30820 int8x8x3_t __s1 = __p1; \ 30821 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 0); \ 30822 }) 30823 #else 30824 #define vst1_s8_x3(__p0, __p1) __extension__ ({ \ 30825 int8x8x3_t __s1 = __p1; \ 30826 int8x8x3_t __rev1; \ 30827 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30828 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30829 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 30830 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 0); \ 30831 }) 30832 #endif 30833 30834 #ifdef __LITTLE_ENDIAN__ 30835 #define vst1_f32_x3(__p0, __p1) __extension__ ({ \ 30836 float32x2x3_t __s1 = __p1; \ 30837 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 9); \ 30838 }) 30839 #else 30840 #define vst1_f32_x3(__p0, __p1) __extension__ ({ \ 30841 float32x2x3_t __s1 = __p1; \ 30842 float32x2x3_t __rev1; \ 30843 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30844 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30845 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 30846 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 9); \ 30847 }) 30848 #endif 30849 30850 #ifdef __LITTLE_ENDIAN__ 30851 #define vst1_s32_x3(__p0, __p1) __extension__ ({ \ 30852 int32x2x3_t __s1 = __p1; \ 30853 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 2); \ 30854 }) 30855 #else 30856 #define vst1_s32_x3(__p0, __p1) __extension__ ({ \ 30857 int32x2x3_t __s1 = __p1; \ 30858 int32x2x3_t __rev1; \ 30859 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30860 __rev1.val[1] = 
__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30861 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 30862 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 2); \ 30863 }) 30864 #endif 30865 30866 #define vst1_s64_x3(__p0, __p1) __extension__ ({ \ 30867 int64x1x3_t __s1 = __p1; \ 30868 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 3); \ 30869 }) 30870 #ifdef __LITTLE_ENDIAN__ 30871 #define vst1_s16_x3(__p0, __p1) __extension__ ({ \ 30872 int16x4x3_t __s1 = __p1; \ 30873 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 1); \ 30874 }) 30875 #else 30876 #define vst1_s16_x3(__p0, __p1) __extension__ ({ \ 30877 int16x4x3_t __s1 = __p1; \ 30878 int16x4x3_t __rev1; \ 30879 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30880 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30881 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 30882 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 1); \ 30883 }) 30884 #endif 30885 30886 #ifdef __LITTLE_ENDIAN__ 30887 #define vst1_p8_x4(__p0, __p1) __extension__ ({ \ 30888 poly8x8x4_t __s1 = __p1; \ 30889 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 4); \ 30890 }) 30891 #else 30892 #define vst1_p8_x4(__p0, __p1) __extension__ ({ \ 30893 poly8x8x4_t __s1 = __p1; \ 30894 poly8x8x4_t __rev1; \ 30895 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30896 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30897 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 30898 __rev1.val[3] = 
__builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 30899 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 4); \ 30900 }) 30901 #endif 30902 30903 #ifdef __LITTLE_ENDIAN__ 30904 #define vst1_p16_x4(__p0, __p1) __extension__ ({ \ 30905 poly16x4x4_t __s1 = __p1; \ 30906 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 5); \ 30907 }) 30908 #else 30909 #define vst1_p16_x4(__p0, __p1) __extension__ ({ \ 30910 poly16x4x4_t __s1 = __p1; \ 30911 poly16x4x4_t __rev1; \ 30912 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30913 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30914 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 30915 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 30916 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 5); \ 30917 }) 30918 #endif 30919 30920 #ifdef __LITTLE_ENDIAN__ 30921 #define vst1q_p8_x4(__p0, __p1) __extension__ ({ \ 30922 poly8x16x4_t __s1 = __p1; \ 30923 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 36); \ 30924 }) 30925 #else 30926 #define vst1q_p8_x4(__p0, __p1) __extension__ ({ \ 30927 poly8x16x4_t __s1 = __p1; \ 30928 poly8x16x4_t __rev1; \ 30929 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30930 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30931 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30932 __rev1.val[3] = 
__builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30933 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 36); \ 30934 }) 30935 #endif 30936 30937 #ifdef __LITTLE_ENDIAN__ 30938 #define vst1q_p16_x4(__p0, __p1) __extension__ ({ \ 30939 poly16x8x4_t __s1 = __p1; \ 30940 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 37); \ 30941 }) 30942 #else 30943 #define vst1q_p16_x4(__p0, __p1) __extension__ ({ \ 30944 poly16x8x4_t __s1 = __p1; \ 30945 poly16x8x4_t __rev1; \ 30946 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 30947 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 30948 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 30949 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 30950 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 37); \ 30951 }) 30952 #endif 30953 30954 #ifdef __LITTLE_ENDIAN__ 30955 #define vst1q_u8_x4(__p0, __p1) __extension__ ({ \ 30956 uint8x16x4_t __s1 = __p1; \ 30957 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 48); \ 30958 }) 30959 #else 30960 #define vst1q_u8_x4(__p0, __p1) __extension__ ({ \ 30961 uint8x16x4_t __s1 = __p1; \ 30962 uint8x16x4_t __rev1; \ 30963 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30964 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30965 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 
15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30966 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 30967 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 48); \ 30968 }) 30969 #endif 30970 30971 #ifdef __LITTLE_ENDIAN__ 30972 #define vst1q_u32_x4(__p0, __p1) __extension__ ({ \ 30973 uint32x4x4_t __s1 = __p1; \ 30974 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 50); \ 30975 }) 30976 #else 30977 #define vst1q_u32_x4(__p0, __p1) __extension__ ({ \ 30978 uint32x4x4_t __s1 = __p1; \ 30979 uint32x4x4_t __rev1; \ 30980 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 30981 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 30982 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 30983 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 30984 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 50); \ 30985 }) 30986 #endif 30987 30988 #ifdef __LITTLE_ENDIAN__ 30989 #define vst1q_u64_x4(__p0, __p1) __extension__ ({ \ 30990 uint64x2x4_t __s1 = __p1; \ 30991 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 51); \ 30992 }) 30993 #else 30994 #define vst1q_u64_x4(__p0, __p1) __extension__ ({ \ 30995 uint64x2x4_t __s1 = __p1; \ 30996 uint64x2x4_t __rev1; \ 30997 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 30998 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 30999 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 31000 __rev1.val[3] = 
__builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 31001 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 51); \ 31002 }) 31003 #endif 31004 31005 #ifdef __LITTLE_ENDIAN__ 31006 #define vst1q_u16_x4(__p0, __p1) __extension__ ({ \ 31007 uint16x8x4_t __s1 = __p1; \ 31008 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 49); \ 31009 }) 31010 #else 31011 #define vst1q_u16_x4(__p0, __p1) __extension__ ({ \ 31012 uint16x8x4_t __s1 = __p1; \ 31013 uint16x8x4_t __rev1; \ 31014 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31015 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31016 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31017 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 31018 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 49); \ 31019 }) 31020 #endif 31021 31022 #ifdef __LITTLE_ENDIAN__ 31023 #define vst1q_s8_x4(__p0, __p1) __extension__ ({ \ 31024 int8x16x4_t __s1 = __p1; \ 31025 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 32); \ 31026 }) 31027 #else 31028 #define vst1q_s8_x4(__p0, __p1) __extension__ ({ \ 31029 int8x16x4_t __s1 = __p1; \ 31030 int8x16x4_t __rev1; \ 31031 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31032 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31033 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 
0); \ 31034 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31035 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 32); \ 31036 }) 31037 #endif 31038 31039 #ifdef __LITTLE_ENDIAN__ 31040 #define vst1q_f32_x4(__p0, __p1) __extension__ ({ \ 31041 float32x4x4_t __s1 = __p1; \ 31042 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 41); \ 31043 }) 31044 #else 31045 #define vst1q_f32_x4(__p0, __p1) __extension__ ({ \ 31046 float32x4x4_t __s1 = __p1; \ 31047 float32x4x4_t __rev1; \ 31048 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31049 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31050 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31051 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 31052 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 41); \ 31053 }) 31054 #endif 31055 31056 #ifdef __LITTLE_ENDIAN__ 31057 #define vst1q_s32_x4(__p0, __p1) __extension__ ({ \ 31058 int32x4x4_t __s1 = __p1; \ 31059 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 34); \ 31060 }) 31061 #else 31062 #define vst1q_s32_x4(__p0, __p1) __extension__ ({ \ 31063 int32x4x4_t __s1 = __p1; \ 31064 int32x4x4_t __rev1; \ 31065 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31066 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31067 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31068 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 
31069 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 34); \ 31070 }) 31071 #endif 31072 31073 #ifdef __LITTLE_ENDIAN__ 31074 #define vst1q_s64_x4(__p0, __p1) __extension__ ({ \ 31075 int64x2x4_t __s1 = __p1; \ 31076 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 35); \ 31077 }) 31078 #else 31079 #define vst1q_s64_x4(__p0, __p1) __extension__ ({ \ 31080 int64x2x4_t __s1 = __p1; \ 31081 int64x2x4_t __rev1; \ 31082 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31083 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31084 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 31085 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 31086 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 35); \ 31087 }) 31088 #endif 31089 31090 #ifdef __LITTLE_ENDIAN__ 31091 #define vst1q_s16_x4(__p0, __p1) __extension__ ({ \ 31092 int16x8x4_t __s1 = __p1; \ 31093 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 33); \ 31094 }) 31095 #else 31096 #define vst1q_s16_x4(__p0, __p1) __extension__ ({ \ 31097 int16x8x4_t __s1 = __p1; \ 31098 int16x8x4_t __rev1; \ 31099 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31100 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31101 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31102 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 31103 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 
(int8x16_t)__rev1.val[3], 33); \ 31104 }) 31105 #endif 31106 31107 #ifdef __LITTLE_ENDIAN__ 31108 #define vst1_u8_x4(__p0, __p1) __extension__ ({ \ 31109 uint8x8x4_t __s1 = __p1; \ 31110 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 16); \ 31111 }) 31112 #else 31113 #define vst1_u8_x4(__p0, __p1) __extension__ ({ \ 31114 uint8x8x4_t __s1 = __p1; \ 31115 uint8x8x4_t __rev1; \ 31116 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31117 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31118 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31119 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 31120 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 16); \ 31121 }) 31122 #endif 31123 31124 #ifdef __LITTLE_ENDIAN__ 31125 #define vst1_u32_x4(__p0, __p1) __extension__ ({ \ 31126 uint32x2x4_t __s1 = __p1; \ 31127 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 18); \ 31128 }) 31129 #else 31130 #define vst1_u32_x4(__p0, __p1) __extension__ ({ \ 31131 uint32x2x4_t __s1 = __p1; \ 31132 uint32x2x4_t __rev1; \ 31133 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31134 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31135 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 31136 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 31137 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 18); \ 31138 }) 31139 #endif 31140 31141 #define vst1_u64_x4(__p0, __p1) __extension__ ({ \ 31142 uint64x1x4_t __s1 
= __p1; \ 31143 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 19); \ 31144 }) 31145 #ifdef __LITTLE_ENDIAN__ 31146 #define vst1_u16_x4(__p0, __p1) __extension__ ({ \ 31147 uint16x4x4_t __s1 = __p1; \ 31148 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 17); \ 31149 }) 31150 #else 31151 #define vst1_u16_x4(__p0, __p1) __extension__ ({ \ 31152 uint16x4x4_t __s1 = __p1; \ 31153 uint16x4x4_t __rev1; \ 31154 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31155 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31156 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31157 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 31158 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 17); \ 31159 }) 31160 #endif 31161 31162 #ifdef __LITTLE_ENDIAN__ 31163 #define vst1_s8_x4(__p0, __p1) __extension__ ({ \ 31164 int8x8x4_t __s1 = __p1; \ 31165 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 0); \ 31166 }) 31167 #else 31168 #define vst1_s8_x4(__p0, __p1) __extension__ ({ \ 31169 int8x8x4_t __s1 = __p1; \ 31170 int8x8x4_t __rev1; \ 31171 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31172 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31173 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31174 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 31175 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 
0); \ 31176 }) 31177 #endif 31178 31179 #ifdef __LITTLE_ENDIAN__ 31180 #define vst1_f32_x4(__p0, __p1) __extension__ ({ \ 31181 float32x2x4_t __s1 = __p1; \ 31182 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 9); \ 31183 }) 31184 #else 31185 #define vst1_f32_x4(__p0, __p1) __extension__ ({ \ 31186 float32x2x4_t __s1 = __p1; \ 31187 float32x2x4_t __rev1; \ 31188 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31189 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31190 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 31191 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 31192 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 9); \ 31193 }) 31194 #endif 31195 31196 #ifdef __LITTLE_ENDIAN__ 31197 #define vst1_s32_x4(__p0, __p1) __extension__ ({ \ 31198 int32x2x4_t __s1 = __p1; \ 31199 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 2); \ 31200 }) 31201 #else 31202 #define vst1_s32_x4(__p0, __p1) __extension__ ({ \ 31203 int32x2x4_t __s1 = __p1; \ 31204 int32x2x4_t __rev1; \ 31205 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31206 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31207 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 31208 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 31209 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 2); \ 31210 }) 31211 #endif 31212 31213 #define vst1_s64_x4(__p0, __p1) __extension__ ({ \ 31214 int64x1x4_t __s1 = __p1; \ 31215 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 
(int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 3); \ 31216 }) 31217 #ifdef __LITTLE_ENDIAN__ 31218 #define vst1_s16_x4(__p0, __p1) __extension__ ({ \ 31219 int16x4x4_t __s1 = __p1; \ 31220 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 1); \ 31221 }) 31222 #else 31223 #define vst1_s16_x4(__p0, __p1) __extension__ ({ \ 31224 int16x4x4_t __s1 = __p1; \ 31225 int16x4x4_t __rev1; \ 31226 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31227 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31228 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31229 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 31230 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 1); \ 31231 }) 31232 #endif 31233 31234 #ifdef __LITTLE_ENDIAN__ 31235 #define vst2_p8(__p0, __p1) __extension__ ({ \ 31236 poly8x8x2_t __s1 = __p1; \ 31237 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 4); \ 31238 }) 31239 #else 31240 #define vst2_p8(__p0, __p1) __extension__ ({ \ 31241 poly8x8x2_t __s1 = __p1; \ 31242 poly8x8x2_t __rev1; \ 31243 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31244 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31245 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 4); \ 31246 }) 31247 #endif 31248 31249 #ifdef __LITTLE_ENDIAN__ 31250 #define vst2_p16(__p0, __p1) __extension__ ({ \ 31251 poly16x4x2_t __s1 = __p1; \ 31252 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 5); \ 31253 }) 31254 #else 31255 #define vst2_p16(__p0, __p1) __extension__ ({ \ 31256 poly16x4x2_t __s1 = __p1; \ 31257 poly16x4x2_t __rev1; \ 31258 __rev1.val[0] = 
__builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31259 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31260 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 5); \ 31261 }) 31262 #endif 31263 31264 #ifdef __LITTLE_ENDIAN__ 31265 #define vst2q_p8(__p0, __p1) __extension__ ({ \ 31266 poly8x16x2_t __s1 = __p1; \ 31267 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 36); \ 31268 }) 31269 #else 31270 #define vst2q_p8(__p0, __p1) __extension__ ({ \ 31271 poly8x16x2_t __s1 = __p1; \ 31272 poly8x16x2_t __rev1; \ 31273 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31274 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31275 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 36); \ 31276 }) 31277 #endif 31278 31279 #ifdef __LITTLE_ENDIAN__ 31280 #define vst2q_p16(__p0, __p1) __extension__ ({ \ 31281 poly16x8x2_t __s1 = __p1; \ 31282 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 37); \ 31283 }) 31284 #else 31285 #define vst2q_p16(__p0, __p1) __extension__ ({ \ 31286 poly16x8x2_t __s1 = __p1; \ 31287 poly16x8x2_t __rev1; \ 31288 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31289 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31290 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 37); \ 31291 }) 31292 #endif 31293 31294 #ifdef __LITTLE_ENDIAN__ 31295 #define vst2q_u8(__p0, __p1) __extension__ ({ \ 31296 uint8x16x2_t __s1 = __p1; \ 31297 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 48); \ 31298 }) 31299 #else 31300 #define vst2q_u8(__p0, __p1) __extension__ ({ \ 31301 uint8x16x2_t __s1 = __p1; \ 31302 
uint8x16x2_t __rev1; \ 31303 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31304 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31305 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 48); \ 31306 }) 31307 #endif 31308 31309 #ifdef __LITTLE_ENDIAN__ 31310 #define vst2q_u32(__p0, __p1) __extension__ ({ \ 31311 uint32x4x2_t __s1 = __p1; \ 31312 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 50); \ 31313 }) 31314 #else 31315 #define vst2q_u32(__p0, __p1) __extension__ ({ \ 31316 uint32x4x2_t __s1 = __p1; \ 31317 uint32x4x2_t __rev1; \ 31318 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31319 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31320 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 50); \ 31321 }) 31322 #endif 31323 31324 #ifdef __LITTLE_ENDIAN__ 31325 #define vst2q_u16(__p0, __p1) __extension__ ({ \ 31326 uint16x8x2_t __s1 = __p1; \ 31327 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 49); \ 31328 }) 31329 #else 31330 #define vst2q_u16(__p0, __p1) __extension__ ({ \ 31331 uint16x8x2_t __s1 = __p1; \ 31332 uint16x8x2_t __rev1; \ 31333 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31334 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31335 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 49); \ 31336 }) 31337 #endif 31338 31339 #ifdef __LITTLE_ENDIAN__ 31340 #define vst2q_s8(__p0, __p1) __extension__ ({ \ 31341 int8x16x2_t __s1 = __p1; \ 31342 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 32); \ 31343 }) 31344 #else 31345 #define vst2q_s8(__p0, __p1) __extension__ ({ \ 
31346 int8x16x2_t __s1 = __p1; \ 31347 int8x16x2_t __rev1; \ 31348 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31349 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31350 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 32); \ 31351 }) 31352 #endif 31353 31354 #ifdef __LITTLE_ENDIAN__ 31355 #define vst2q_f32(__p0, __p1) __extension__ ({ \ 31356 float32x4x2_t __s1 = __p1; \ 31357 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 41); \ 31358 }) 31359 #else 31360 #define vst2q_f32(__p0, __p1) __extension__ ({ \ 31361 float32x4x2_t __s1 = __p1; \ 31362 float32x4x2_t __rev1; \ 31363 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31364 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31365 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 41); \ 31366 }) 31367 #endif 31368 31369 #ifdef __LITTLE_ENDIAN__ 31370 #define vst2q_s32(__p0, __p1) __extension__ ({ \ 31371 int32x4x2_t __s1 = __p1; \ 31372 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 34); \ 31373 }) 31374 #else 31375 #define vst2q_s32(__p0, __p1) __extension__ ({ \ 31376 int32x4x2_t __s1 = __p1; \ 31377 int32x4x2_t __rev1; \ 31378 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31379 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31380 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 34); \ 31381 }) 31382 #endif 31383 31384 #ifdef __LITTLE_ENDIAN__ 31385 #define vst2q_s16(__p0, __p1) __extension__ ({ \ 31386 int16x8x2_t __s1 = __p1; \ 31387 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 33); \ 31388 }) 31389 #else 31390 #define vst2q_s16(__p0, __p1) 
__extension__ ({ \ 31391 int16x8x2_t __s1 = __p1; \ 31392 int16x8x2_t __rev1; \ 31393 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31394 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31395 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 33); \ 31396 }) 31397 #endif 31398 31399 /* vst2_u8: passes __p0 and both vectors of a uint8x8x2_t (each cast to int8x8_t) to __builtin_neon_vst2_v with constant 16; the #else variant reverses each vector's eight lanes first. */ #ifdef __LITTLE_ENDIAN__ 31400 #define vst2_u8(__p0, __p1) __extension__ ({ \ 31401 uint8x8x2_t __s1 = __p1; \ 31402 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 16); \ 31403 }) 31404 #else 31405 #define vst2_u8(__p0, __p1) __extension__ ({ \ 31406 uint8x8x2_t __s1 = __p1; \ 31407 uint8x8x2_t __rev1; \ 31408 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31409 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31410 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 16); \ 31411 }) 31412 #endif 31413 31414 /* vst2_u32: same shape for a uint32x2x2_t argument; constant 18, two lanes swapped per vector in the #else variant. */ #ifdef __LITTLE_ENDIAN__ 31415 #define vst2_u32(__p0, __p1) __extension__ ({ \ 31416 uint32x2x2_t __s1 = __p1; \ 31417 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 18); \ 31418 }) 31419 #else 31420 #define vst2_u32(__p0, __p1) __extension__ ({ \ 31421 uint32x2x2_t __s1 = __p1; \ 31422 uint32x2x2_t __rev1; \ 31423 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31424 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31425 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 18); \ 31426 }) 31427 #endif 31428 31429 /* vst2_u64: defined once, outside any __LITTLE_ENDIAN__ conditional, with no lane shuffle; forwards a uint64x1x2_t to __builtin_neon_vst2_v with constant 19. */ #define vst2_u64(__p0, __p1) __extension__ ({ \ 31430 uint64x1x2_t __s1 = __p1; \ 31431 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 19); \ 31432 }) 31433 /* vst2_u16: uint16x4x2_t argument, constant 17; the little-endian body continues on the next line. */ #ifdef __LITTLE_ENDIAN__ 31434 #define vst2_u16(__p0, __p1) __extension__ ({ \ 31435 uint16x4x2_t __s1 = __p1; \ 31436
__builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 17); \ 31437 }) 31438 #else 31439 #define vst2_u16(__p0, __p1) __extension__ ({ \ 31440 uint16x4x2_t __s1 = __p1; \ 31441 uint16x4x2_t __rev1; \ 31442 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31443 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31444 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 17); \ 31445 }) 31446 #endif 31447 31448 /* vst2_s8: passes __p0 and both vectors of an int8x8x2_t to __builtin_neon_vst2_v with constant 0; the #else variant reverses each vector's eight lanes first. */ #ifdef __LITTLE_ENDIAN__ 31449 #define vst2_s8(__p0, __p1) __extension__ ({ \ 31450 int8x8x2_t __s1 = __p1; \ 31451 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 0); \ 31452 }) 31453 #else 31454 #define vst2_s8(__p0, __p1) __extension__ ({ \ 31455 int8x8x2_t __s1 = __p1; \ 31456 int8x8x2_t __rev1; \ 31457 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31458 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31459 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 0); \ 31460 }) 31461 #endif 31462 31463 /* vst2_f32: same shape for a float32x2x2_t argument (cast to int8x8_t); constant 9, two lanes swapped per vector in the #else variant. */ #ifdef __LITTLE_ENDIAN__ 31464 #define vst2_f32(__p0, __p1) __extension__ ({ \ 31465 float32x2x2_t __s1 = __p1; \ 31466 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 9); \ 31467 }) 31468 #else 31469 #define vst2_f32(__p0, __p1) __extension__ ({ \ 31470 float32x2x2_t __s1 = __p1; \ 31471 float32x2x2_t __rev1; \ 31472 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31473 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31474 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 9); \ 31475 }) 31476 #endif 31477 31478 /* vst2_s32: int32x2x2_t argument, constant 2; the closing of the little-endian macro and the #else variant follow on the next line. */ #ifdef __LITTLE_ENDIAN__ 31479 #define vst2_s32(__p0, __p1) __extension__ ({ \ 31480 int32x2x2_t __s1 = __p1; \ 31481 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 2); \ 31482
}) 31483 #else 31484 #define vst2_s32(__p0, __p1) __extension__ ({ \ 31485 int32x2x2_t __s1 = __p1; \ 31486 int32x2x2_t __rev1; \ 31487 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31488 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31489 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 2); \ 31490 }) 31491 #endif 31492 31493 /* vst2_s64: defined once, outside any __LITTLE_ENDIAN__ conditional, with no lane shuffle; forwards an int64x1x2_t to __builtin_neon_vst2_v with constant 3. */ #define vst2_s64(__p0, __p1) __extension__ ({ \ 31494 int64x1x2_t __s1 = __p1; \ 31495 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 3); \ 31496 }) 31497 /* vst2_s16: int16x4x2_t argument forwarded to __builtin_neon_vst2_v with constant 1; the #else variant reverses each vector's four lanes first. */ #ifdef __LITTLE_ENDIAN__ 31498 #define vst2_s16(__p0, __p1) __extension__ ({ \ 31499 int16x4x2_t __s1 = __p1; \ 31500 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 1); \ 31501 }) 31502 #else 31503 #define vst2_s16(__p0, __p1) __extension__ ({ \ 31504 int16x4x2_t __s1 = __p1; \ 31505 int16x4x2_t __rev1; \ 31506 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31507 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31508 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 1); \ 31509 }) 31510 #endif 31511 31512 /* vst2_lane_p8: passes __p0, both vectors of a poly8x8x2_t (cast to int8x8_t) and the third argument __p2 to __builtin_neon_vst2_lane_v with constant 4; the #else variant reverses the vectors' lanes but hands __p2 through unchanged. */ #ifdef __LITTLE_ENDIAN__ 31513 #define vst2_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 31514 poly8x8x2_t __s1 = __p1; \ 31515 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 4); \ 31516 }) 31517 #else 31518 #define vst2_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 31519 poly8x8x2_t __s1 = __p1; \ 31520 poly8x8x2_t __rev1; \ 31521 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31522 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31523 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 4); \ 31524 }) 31525 #endif 31526 31527 /* vst2_lane_p16: the macro head is on this line; its body follows on the next line. */ #ifdef __LITTLE_ENDIAN__ 31528 #define vst2_lane_p16(__p0, __p1, __p2)
__extension__ ({ \ 31529 poly16x4x2_t __s1 = __p1; \ 31530 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 5); \ 31531 }) 31532 #else 31533 #define vst2_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 31534 poly16x4x2_t __s1 = __p1; \ 31535 poly16x4x2_t __rev1; \ 31536 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31537 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31538 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 5); \ 31539 }) 31540 #endif 31541 31542 /* vst2q_lane_p16: passes __p0, both vectors of a poly16x8x2_t (cast to int8x16_t) and the third argument __p2 to __builtin_neon_vst2q_lane_v with constant 37; the #else variant reverses the vectors' eight lanes but hands __p2 through unchanged. */ #ifdef __LITTLE_ENDIAN__ 31543 #define vst2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 31544 poly16x8x2_t __s1 = __p1; \ 31545 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 37); \ 31546 }) 31547 #else 31548 #define vst2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 31549 poly16x8x2_t __s1 = __p1; \ 31550 poly16x8x2_t __rev1; \ 31551 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31552 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31553 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 37); \ 31554 }) 31555 #endif 31556 31557 /* vst2q_lane_u32: same shape for a uint32x4x2_t argument; constant 50, four lanes reversed per vector in the #else variant. */ #ifdef __LITTLE_ENDIAN__ 31558 #define vst2q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 31559 uint32x4x2_t __s1 = __p1; \ 31560 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 50); \ 31561 }) 31562 #else 31563 #define vst2q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 31564 uint32x4x2_t __s1 = __p1; \ 31565 uint32x4x2_t __rev1; \ 31566 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31567 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31568 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 50); \ 31569 }) 31570 #endif
31571 31572 /* vst2q_lane_u16: passes __p0, both vectors of a uint16x8x2_t (cast to int8x16_t) and the third argument __p2 to __builtin_neon_vst2q_lane_v with constant 49; the #else variant reverses the vectors' eight lanes but hands __p2 through unchanged. */ #ifdef __LITTLE_ENDIAN__ 31573 #define vst2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 31574 uint16x8x2_t __s1 = __p1; \ 31575 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 49); \ 31576 }) 31577 #else 31578 #define vst2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 31579 uint16x8x2_t __s1 = __p1; \ 31580 uint16x8x2_t __rev1; \ 31581 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31582 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31583 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 49); \ 31584 }) 31585 #endif 31586 31587 /* vst2q_lane_f32: same shape for a float32x4x2_t argument; constant 41, four lanes reversed per vector in the #else variant. */ #ifdef __LITTLE_ENDIAN__ 31588 #define vst2q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 31589 float32x4x2_t __s1 = __p1; \ 31590 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 41); \ 31591 }) 31592 #else 31593 #define vst2q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 31594 float32x4x2_t __s1 = __p1; \ 31595 float32x4x2_t __rev1; \ 31596 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31597 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31598 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 41); \ 31599 }) 31600 #endif 31601 31602 /* vst2q_lane_s32: int32x4x2_t argument, constant 34; the final builtin call of the #else variant is on the next line. */ #ifdef __LITTLE_ENDIAN__ 31603 #define vst2q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 31604 int32x4x2_t __s1 = __p1; \ 31605 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 34); \ 31606 }) 31607 #else 31608 #define vst2q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 31609 int32x4x2_t __s1 = __p1; \ 31610 int32x4x2_t __rev1; \ 31611 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31612 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31613
__builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 34); \ 31614 }) 31615 #endif 31616 31617 /* vst2q_lane_s16: passes __p0, both vectors of an int16x8x2_t (cast to int8x16_t) and the third argument __p2 to __builtin_neon_vst2q_lane_v with constant 33; the #else variant reverses the vectors' eight lanes but hands __p2 through unchanged. */ #ifdef __LITTLE_ENDIAN__ 31618 #define vst2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 31619 int16x8x2_t __s1 = __p1; \ 31620 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 33); \ 31621 }) 31622 #else 31623 #define vst2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 31624 int16x8x2_t __s1 = __p1; \ 31625 int16x8x2_t __rev1; \ 31626 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31627 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31628 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 33); \ 31629 }) 31630 #endif 31631 31632 /* vst2_lane_u8: same shape for a uint8x8x2_t argument cast to int8x8_t and sent to __builtin_neon_vst2_lane_v; constant 16. */ #ifdef __LITTLE_ENDIAN__ 31633 #define vst2_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 31634 uint8x8x2_t __s1 = __p1; \ 31635 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 16); \ 31636 }) 31637 #else 31638 #define vst2_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 31639 uint8x8x2_t __s1 = __p1; \ 31640 uint8x8x2_t __rev1; \ 31641 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31642 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31643 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 16); \ 31644 }) 31645 #endif 31646 31647 /* vst2_lane_u32: uint32x2x2_t argument, constant 18; the #else variant swaps each vector's two lanes and finishes on the next line. */ #ifdef __LITTLE_ENDIAN__ 31648 #define vst2_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 31649 uint32x2x2_t __s1 = __p1; \ 31650 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 18); \ 31651 }) 31652 #else 31653 #define vst2_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 31654 uint32x2x2_t __s1 = __p1; \ 31655 uint32x2x2_t __rev1; \ 31656 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
31657 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31658 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 18); \ 31659 }) 31660 #endif 31661 31662 /* vst2_lane_u16: passes __p0, both vectors of a uint16x4x2_t (cast to int8x8_t) and the third argument __p2 to __builtin_neon_vst2_lane_v with constant 17; the #else variant reverses the vectors' four lanes but hands __p2 through unchanged. */ #ifdef __LITTLE_ENDIAN__ 31663 #define vst2_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 31664 uint16x4x2_t __s1 = __p1; \ 31665 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 17); \ 31666 }) 31667 #else 31668 #define vst2_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 31669 uint16x4x2_t __s1 = __p1; \ 31670 uint16x4x2_t __rev1; \ 31671 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31672 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31673 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 17); \ 31674 }) 31675 #endif 31676 31677 /* vst2_lane_s8: same shape for an int8x8x2_t argument; constant 0, eight lanes reversed per vector in the #else variant. */ #ifdef __LITTLE_ENDIAN__ 31678 #define vst2_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 31679 int8x8x2_t __s1 = __p1; \ 31680 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 0); \ 31681 }) 31682 #else 31683 #define vst2_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 31684 int8x8x2_t __s1 = __p1; \ 31685 int8x8x2_t __rev1; \ 31686 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31687 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31688 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 0); \ 31689 }) 31690 #endif 31691 31692 /* vst2_lane_f32: float32x2x2_t argument, constant 9; the #else variant's lane swaps continue on the next line. */ #ifdef __LITTLE_ENDIAN__ 31693 #define vst2_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 31694 float32x2x2_t __s1 = __p1; \ 31695 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 9); \ 31696 }) 31697 #else 31698 #define vst2_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 31699 float32x2x2_t __s1 = __p1; \ 31700 float32x2x2_t __rev1; \ 31701 __rev1.val[0] =
__builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31702 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31703 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 9); \ 31704 }) 31705 #endif 31706 31707 /* vst2_lane_s32: passes __p0, both vectors of an int32x2x2_t (cast to int8x8_t) and the third argument __p2 to __builtin_neon_vst2_lane_v with constant 2; the #else variant swaps each vector's two lanes but hands __p2 through unchanged. */ #ifdef __LITTLE_ENDIAN__ 31708 #define vst2_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 31709 int32x2x2_t __s1 = __p1; \ 31710 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 2); \ 31711 }) 31712 #else 31713 #define vst2_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 31714 int32x2x2_t __s1 = __p1; \ 31715 int32x2x2_t __rev1; \ 31716 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31717 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31718 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 2); \ 31719 }) 31720 #endif 31721 31722 /* vst2_lane_s16: same shape for an int16x4x2_t argument; constant 1, four lanes reversed per vector in the #else variant. */ #ifdef __LITTLE_ENDIAN__ 31723 #define vst2_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 31724 int16x4x2_t __s1 = __p1; \ 31725 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 1); \ 31726 }) 31727 #else 31728 #define vst2_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 31729 int16x4x2_t __s1 = __p1; \ 31730 int16x4x2_t __rev1; \ 31731 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31732 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31733 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 1); \ 31734 }) 31735 #endif 31736 31737 /* vst3_p8: passes __p0 and the three vectors of a poly8x8x3_t (cast to int8x8_t) to __builtin_neon_vst3_v with constant 4; the #else variant, which continues on the next line, reverses each vector's lanes first. */ #ifdef __LITTLE_ENDIAN__ 31738 #define vst3_p8(__p0, __p1) __extension__ ({ \ 31739 poly8x8x3_t __s1 = __p1; \ 31740 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 4); \ 31741 }) 31742 #else 31743 #define vst3_p8(__p0, __p1) __extension__ ({ \ 31744 poly8x8x3_t __s1 = __p1; \ 31745 poly8x8x3_t __rev1; \ 31746 __rev1.val[0] =
__builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31747 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31748 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31749 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 4); \ 31750 }) 31751 #endif 31752 31753 /* vst3_p16: passes __p0 and the three vectors of a poly16x4x3_t (cast to int8x8_t) to __builtin_neon_vst3_v with constant 5; the #else variant reverses each vector's four lanes first. */ #ifdef __LITTLE_ENDIAN__ 31754 #define vst3_p16(__p0, __p1) __extension__ ({ \ 31755 poly16x4x3_t __s1 = __p1; \ 31756 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 5); \ 31757 }) 31758 #else 31759 #define vst3_p16(__p0, __p1) __extension__ ({ \ 31760 poly16x4x3_t __s1 = __p1; \ 31761 poly16x4x3_t __rev1; \ 31762 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31763 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31764 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31765 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 5); \ 31766 }) 31767 #endif 31768 31769 /* vst3q_p8: poly8x16x3_t argument cast to int8x16_t and sent to __builtin_neon_vst3q_v with constant 36; the #else variant reverses sixteen lanes per vector and finishes on the next line. */ #ifdef __LITTLE_ENDIAN__ 31770 #define vst3q_p8(__p0, __p1) __extension__ ({ \ 31771 poly8x16x3_t __s1 = __p1; \ 31772 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 36); \ 31773 }) 31774 #else 31775 #define vst3q_p8(__p0, __p1) __extension__ ({ \ 31776 poly8x16x3_t __s1 = __p1; \ 31777 poly8x16x3_t __rev1; \ 31778 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31779 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31780 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31781 __builtin_neon_vst3q_v(__p0,
(int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 36); \ 31782 }) 31783 #endif 31784 31785 /* vst3q_p16: passes __p0 and the three vectors of a poly16x8x3_t (cast to int8x16_t) to __builtin_neon_vst3q_v with constant 37; the #else variant reverses each vector's eight lanes first. */ #ifdef __LITTLE_ENDIAN__ 31786 #define vst3q_p16(__p0, __p1) __extension__ ({ \ 31787 poly16x8x3_t __s1 = __p1; \ 31788 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 37); \ 31789 }) 31790 #else 31791 #define vst3q_p16(__p0, __p1) __extension__ ({ \ 31792 poly16x8x3_t __s1 = __p1; \ 31793 poly16x8x3_t __rev1; \ 31794 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31795 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31796 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31797 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 37); \ 31798 }) 31799 #endif 31800 31801 /* vst3q_u8: same shape for a uint8x16x3_t argument; constant 48, sixteen lanes reversed per vector in the #else variant. */ #ifdef __LITTLE_ENDIAN__ 31802 #define vst3q_u8(__p0, __p1) __extension__ ({ \ 31803 uint8x16x3_t __s1 = __p1; \ 31804 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 48); \ 31805 }) 31806 #else 31807 #define vst3q_u8(__p0, __p1) __extension__ ({ \ 31808 uint8x16x3_t __s1 = __p1; \ 31809 uint8x16x3_t __rev1; \ 31810 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31811 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31812 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31813 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 48); \ 31814 }) 31815 #endif 31816 31817 /* vst3q_u32: uint32x4x3_t argument; the little-endian builtin call's arguments continue on the next line. */ #ifdef __LITTLE_ENDIAN__ 31818 #define vst3q_u32(__p0, __p1) __extension__ ({ \ 31819 uint32x4x3_t __s1 = __p1; \ 31820 __builtin_neon_vst3q_v(__p0,
(int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 50); \ 31821 }) 31822 #else 31823 #define vst3q_u32(__p0, __p1) __extension__ ({ \ 31824 uint32x4x3_t __s1 = __p1; \ 31825 uint32x4x3_t __rev1; \ 31826 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31827 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31828 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31829 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 50); \ 31830 }) 31831 #endif 31832 31833 /* vst3q_u16: passes __p0 and the three vectors of a uint16x8x3_t (cast to int8x16_t) to __builtin_neon_vst3q_v with constant 49; the #else variant reverses each vector's eight lanes first. */ #ifdef __LITTLE_ENDIAN__ 31834 #define vst3q_u16(__p0, __p1) __extension__ ({ \ 31835 uint16x8x3_t __s1 = __p1; \ 31836 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 49); \ 31837 }) 31838 #else 31839 #define vst3q_u16(__p0, __p1) __extension__ ({ \ 31840 uint16x8x3_t __s1 = __p1; \ 31841 uint16x8x3_t __rev1; \ 31842 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31843 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31844 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31845 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 49); \ 31846 }) 31847 #endif 31848 31849 /* vst3q_s8: int8x16x3_t argument, constant 32; the #else variant reverses sixteen lanes per vector and continues on the next line. */ #ifdef __LITTLE_ENDIAN__ 31850 #define vst3q_s8(__p0, __p1) __extension__ ({ \ 31851 int8x16x3_t __s1 = __p1; \ 31852 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 32); \ 31853 }) 31854 #else 31855 #define vst3q_s8(__p0, __p1) __extension__ ({ \ 31856 int8x16x3_t __s1 = __p1; \ 31857 int8x16x3_t __rev1; \ 31858 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31859 __rev1.val[1] =
__builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31860 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 31861 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 32); \ 31862 }) 31863 #endif 31864 31865 /* vst3q_f32: passes __p0 and the three vectors of a float32x4x3_t (cast to int8x16_t) to __builtin_neon_vst3q_v with constant 41; the #else variant reverses each vector's four lanes first. */ #ifdef __LITTLE_ENDIAN__ 31866 #define vst3q_f32(__p0, __p1) __extension__ ({ \ 31867 float32x4x3_t __s1 = __p1; \ 31868 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 41); \ 31869 }) 31870 #else 31871 #define vst3q_f32(__p0, __p1) __extension__ ({ \ 31872 float32x4x3_t __s1 = __p1; \ 31873 float32x4x3_t __rev1; \ 31874 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31875 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31876 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31877 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 41); \ 31878 }) 31879 #endif 31880 31881 /* vst3q_s32: same shape for an int32x4x3_t argument; constant 34. */ #ifdef __LITTLE_ENDIAN__ 31882 #define vst3q_s32(__p0, __p1) __extension__ ({ \ 31883 int32x4x3_t __s1 = __p1; \ 31884 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 34); \ 31885 }) 31886 #else 31887 #define vst3q_s32(__p0, __p1) __extension__ ({ \ 31888 int32x4x3_t __s1 = __p1; \ 31889 int32x4x3_t __rev1; \ 31890 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31891 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31892 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31893 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 34); \ 31894 }) 31895 #endif 31896 31897 /* Opens the little-endian / #else pair for the macro whose name and body follow on the next line. */ #ifdef __LITTLE_ENDIAN__ 31898 #define
vst3q_s16(__p0, __p1) __extension__ ({ \ 31899 int16x8x3_t __s1 = __p1; \ 31900 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 33); \ 31901 }) 31902 #else /* vst3q_s16, non-little-endian form: reverses the eight lanes of each of the three vectors before the same __builtin_neon_vst3q_v call (constant 33). */ 31903 #define vst3q_s16(__p0, __p1) __extension__ ({ \ 31904 int16x8x3_t __s1 = __p1; \ 31905 int16x8x3_t __rev1; \ 31906 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31907 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31908 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31909 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 33); \ 31910 }) 31911 #endif 31912 31913 /* vst3_u8: passes __p0 and the three vectors of a uint8x8x3_t (cast to int8x8_t) to __builtin_neon_vst3_v with constant 16; the #else variant reverses each vector's eight lanes first. */ #ifdef __LITTLE_ENDIAN__ 31914 #define vst3_u8(__p0, __p1) __extension__ ({ \ 31915 uint8x8x3_t __s1 = __p1; \ 31916 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 16); \ 31917 }) 31918 #else 31919 #define vst3_u8(__p0, __p1) __extension__ ({ \ 31920 uint8x8x3_t __s1 = __p1; \ 31921 uint8x8x3_t __rev1; \ 31922 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31923 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31924 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31925 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 16); \ 31926 }) 31927 #endif 31928 31929 /* vst3_u32: uint32x2x3_t argument, constant 18; the #else variant swaps each vector's two lanes and continues on the next line. */ #ifdef __LITTLE_ENDIAN__ 31930 #define vst3_u32(__p0, __p1) __extension__ ({ \ 31931 uint32x2x3_t __s1 = __p1; \ 31932 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 18); \ 31933 }) 31934 #else 31935 #define vst3_u32(__p0, __p1) __extension__ ({ \ 31936 uint32x2x3_t __s1 = __p1; \ 31937 uint32x2x3_t __rev1; \ 31938 __rev1.val[0] = __builtin_shufflevector(__s1.val[0],
__s1.val[0], 1, 0); \ 31939 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31940 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 31941 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 18); \ 31942 }) 31943 #endif 31944 31945 /* vst3_u64: defined once, outside any __LITTLE_ENDIAN__ conditional, with no lane shuffle; forwards the three vectors of a uint64x1x3_t to __builtin_neon_vst3_v with constant 19. */ #define vst3_u64(__p0, __p1) __extension__ ({ \ 31946 uint64x1x3_t __s1 = __p1; \ 31947 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 19); \ 31948 }) 31949 /* vst3_u16: uint16x4x3_t argument forwarded to __builtin_neon_vst3_v with constant 17; the #else variant reverses each vector's four lanes first. */ #ifdef __LITTLE_ENDIAN__ 31950 #define vst3_u16(__p0, __p1) __extension__ ({ \ 31951 uint16x4x3_t __s1 = __p1; \ 31952 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 17); \ 31953 }) 31954 #else 31955 #define vst3_u16(__p0, __p1) __extension__ ({ \ 31956 uint16x4x3_t __s1 = __p1; \ 31957 uint16x4x3_t __rev1; \ 31958 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 31959 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 31960 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 31961 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 17); \ 31962 }) 31963 #endif 31964 31965 /* vst3_s8: int8x8x3_t argument, constant 0; the #else variant reverses eight lanes per vector and its builtin call continues on the next line. */ #ifdef __LITTLE_ENDIAN__ 31966 #define vst3_s8(__p0, __p1) __extension__ ({ \ 31967 int8x8x3_t __s1 = __p1; \ 31968 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 0); \ 31969 }) 31970 #else 31971 #define vst3_s8(__p0, __p1) __extension__ ({ \ 31972 int8x8x3_t __s1 = __p1; \ 31973 int8x8x3_t __rev1; \ 31974 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 31975 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 31976 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 31977 __builtin_neon_vst3_v(__p0,
(int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 0); \ 31978 }) 31979 #endif 31980 31981 /* vst3_f32: passes __p0 and the three vectors of a float32x2x3_t (cast to int8x8_t) to __builtin_neon_vst3_v with constant 9; the #else variant swaps each vector's two lanes first. */ #ifdef __LITTLE_ENDIAN__ 31982 #define vst3_f32(__p0, __p1) __extension__ ({ \ 31983 float32x2x3_t __s1 = __p1; \ 31984 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 9); \ 31985 }) 31986 #else 31987 #define vst3_f32(__p0, __p1) __extension__ ({ \ 31988 float32x2x3_t __s1 = __p1; \ 31989 float32x2x3_t __rev1; \ 31990 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 31991 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 31992 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 31993 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 9); \ 31994 }) 31995 #endif 31996 31997 /* vst3_s32: same shape for an int32x2x3_t argument; constant 2. */ #ifdef __LITTLE_ENDIAN__ 31998 #define vst3_s32(__p0, __p1) __extension__ ({ \ 31999 int32x2x3_t __s1 = __p1; \ 32000 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 2); \ 32001 }) 32002 #else 32003 #define vst3_s32(__p0, __p1) __extension__ ({ \ 32004 int32x2x3_t __s1 = __p1; \ 32005 int32x2x3_t __rev1; \ 32006 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32007 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32008 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32009 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 2); \ 32010 }) 32011 #endif 32012 32013 /* vst3_s64: defined once, outside any __LITTLE_ENDIAN__ conditional, with no lane shuffle; forwards the three vectors of an int64x1x3_t to __builtin_neon_vst3_v with constant 3. */ #define vst3_s64(__p0, __p1) __extension__ ({ \ 32014 int64x1x3_t __s1 = __p1; \ 32015 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 3); \ 32016 }) 32017 /* vst3_s16: int16x4x3_t argument; the little-endian builtin call's remaining arguments are on the next line. */ #ifdef __LITTLE_ENDIAN__ 32018 #define vst3_s16(__p0, __p1) __extension__ ({ \ 32019 int16x4x3_t __s1 = __p1; \ 32020 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0],
(int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 1); \ 32021 }) 32022 #else 32023 #define vst3_s16(__p0, __p1) __extension__ ({ \ 32024 int16x4x3_t __s1 = __p1; \ 32025 int16x4x3_t __rev1; \ 32026 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32027 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32028 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32029 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 1); \ 32030 }) 32031 #endif 32032 32033 /* vst3_lane_p8: passes __p0, the three vectors of a poly8x8x3_t (cast to int8x8_t) and the third argument __p2 to __builtin_neon_vst3_lane_v with constant 4; the #else variant reverses the vectors' eight lanes but hands __p2 through unchanged. */ #ifdef __LITTLE_ENDIAN__ 32034 #define vst3_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 32035 poly8x8x3_t __s1 = __p1; \ 32036 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 4); \ 32037 }) 32038 #else 32039 #define vst3_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 32040 poly8x8x3_t __s1 = __p1; \ 32041 poly8x8x3_t __rev1; \ 32042 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32043 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32044 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32045 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 4); \ 32046 }) 32047 #endif 32048 32049 /* vst3_lane_p16: poly16x4x3_t argument, constant 5; the #else variant reverses four lanes per vector and continues on the next line. */ #ifdef __LITTLE_ENDIAN__ 32050 #define vst3_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 32051 poly16x4x3_t __s1 = __p1; \ 32052 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 5); \ 32053 }) 32054 #else 32055 #define vst3_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 32056 poly16x4x3_t __s1 = __p1; \ 32057 poly16x4x3_t __rev1; \ 32058 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32059 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3,
2, 1, 0); \ 32060 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32061 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 5); \ 32062 }) 32063 #endif 32064 32065 /* vst3q_lane_p16: passes __p0, the three vectors of a poly16x8x3_t (cast to int8x16_t) and the third argument __p2 to __builtin_neon_vst3q_lane_v with constant 37; the #else variant reverses the vectors' eight lanes but hands __p2 through unchanged. */ #ifdef __LITTLE_ENDIAN__ 32066 #define vst3q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 32067 poly16x8x3_t __s1 = __p1; \ 32068 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 37); \ 32069 }) 32070 #else 32071 #define vst3q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 32072 poly16x8x3_t __s1 = __p1; \ 32073 poly16x8x3_t __rev1; \ 32074 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32075 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32076 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32077 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 37); \ 32078 }) 32079 #endif 32080 32081 /* vst3q_lane_u32: same shape for a uint32x4x3_t argument; constant 50, four lanes reversed per vector in the #else variant. */ #ifdef __LITTLE_ENDIAN__ 32082 #define vst3q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 32083 uint32x4x3_t __s1 = __p1; \ 32084 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 50); \ 32085 }) 32086 #else 32087 #define vst3q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 32088 uint32x4x3_t __s1 = __p1; \ 32089 uint32x4x3_t __rev1; \ 32090 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32091 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32092 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32093 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 50); \ 32094 }) 32095 #endif 32096 32097 /* Opens the little-endian / #else pair for the macro whose name and body follow on the next line. */ #ifdef __LITTLE_ENDIAN__ 32098 #define
vst3q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 32099 uint16x8x3_t __s1 = __p1; \ 32100 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 49); \ 32101 }) 32102 #else 32103 #define vst3q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 32104 uint16x8x3_t __s1 = __p1; \ 32105 uint16x8x3_t __rev1; \ 32106 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32107 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32108 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32109 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 49); \ 32110 }) 32111 #endif 32112 32113 #ifdef __LITTLE_ENDIAN__ 32114 #define vst3q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 32115 float32x4x3_t __s1 = __p1; \ 32116 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 41); \ 32117 }) 32118 #else 32119 #define vst3q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 32120 float32x4x3_t __s1 = __p1; \ 32121 float32x4x3_t __rev1; \ 32122 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32123 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32124 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32125 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 41); \ 32126 }) 32127 #endif 32128 32129 #ifdef __LITTLE_ENDIAN__ 32130 #define vst3q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 32131 int32x4x3_t __s1 = __p1; \ 32132 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 34); \ 32133 }) 32134 #else 32135 #define vst3q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 32136 
int32x4x3_t __s1 = __p1; \ 32137 int32x4x3_t __rev1; \ 32138 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32139 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32140 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32141 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 34); \ 32142 }) 32143 #endif 32144 32145 #ifdef __LITTLE_ENDIAN__ 32146 #define vst3q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 32147 int16x8x3_t __s1 = __p1; \ 32148 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 33); \ 32149 }) 32150 #else 32151 #define vst3q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 32152 int16x8x3_t __s1 = __p1; \ 32153 int16x8x3_t __rev1; \ 32154 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32155 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32156 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32157 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 33); \ 32158 }) 32159 #endif 32160 32161 #ifdef __LITTLE_ENDIAN__ 32162 #define vst3_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 32163 uint8x8x3_t __s1 = __p1; \ 32164 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 16); \ 32165 }) 32166 #else 32167 #define vst3_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 32168 uint8x8x3_t __s1 = __p1; \ 32169 uint8x8x3_t __rev1; \ 32170 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32171 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32172 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 
7, 6, 5, 4, 3, 2, 1, 0); \ 32173 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 16); \ 32174 }) 32175 #endif 32176 32177 #ifdef __LITTLE_ENDIAN__ 32178 #define vst3_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 32179 uint32x2x3_t __s1 = __p1; \ 32180 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 18); \ 32181 }) 32182 #else 32183 #define vst3_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 32184 uint32x2x3_t __s1 = __p1; \ 32185 uint32x2x3_t __rev1; \ 32186 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32187 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32188 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32189 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 18); \ 32190 }) 32191 #endif 32192 32193 #ifdef __LITTLE_ENDIAN__ 32194 #define vst3_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 32195 uint16x4x3_t __s1 = __p1; \ 32196 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 17); \ 32197 }) 32198 #else 32199 #define vst3_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 32200 uint16x4x3_t __s1 = __p1; \ 32201 uint16x4x3_t __rev1; \ 32202 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32203 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32204 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32205 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 17); \ 32206 }) 32207 #endif 32208 32209 #ifdef __LITTLE_ENDIAN__ 32210 #define vst3_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 32211 int8x8x3_t __s1 = __p1; \ 32212 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], 
(int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 0); \ 32213 }) 32214 #else 32215 #define vst3_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 32216 int8x8x3_t __s1 = __p1; \ 32217 int8x8x3_t __rev1; \ 32218 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32219 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32220 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32221 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 0); \ 32222 }) 32223 #endif 32224 32225 #ifdef __LITTLE_ENDIAN__ 32226 #define vst3_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 32227 float32x2x3_t __s1 = __p1; \ 32228 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 9); \ 32229 }) 32230 #else 32231 #define vst3_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 32232 float32x2x3_t __s1 = __p1; \ 32233 float32x2x3_t __rev1; \ 32234 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32235 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32236 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32237 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 9); \ 32238 }) 32239 #endif 32240 32241 #ifdef __LITTLE_ENDIAN__ 32242 #define vst3_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 32243 int32x2x3_t __s1 = __p1; \ 32244 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 2); \ 32245 }) 32246 #else 32247 #define vst3_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 32248 int32x2x3_t __s1 = __p1; \ 32249 int32x2x3_t __rev1; \ 32250 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32251 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], 
__s1.val[1], 1, 0); \ 32252 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32253 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 2); \ 32254 }) 32255 #endif 32256 32257 #ifdef __LITTLE_ENDIAN__ 32258 #define vst3_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 32259 int16x4x3_t __s1 = __p1; \ 32260 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 1); \ 32261 }) 32262 #else 32263 #define vst3_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 32264 int16x4x3_t __s1 = __p1; \ 32265 int16x4x3_t __rev1; \ 32266 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32267 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32268 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32269 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 1); \ 32270 }) 32271 #endif 32272 32273 #ifdef __LITTLE_ENDIAN__ 32274 #define vst4_p8(__p0, __p1) __extension__ ({ \ 32275 poly8x8x4_t __s1 = __p1; \ 32276 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 4); \ 32277 }) 32278 #else 32279 #define vst4_p8(__p0, __p1) __extension__ ({ \ 32280 poly8x8x4_t __s1 = __p1; \ 32281 poly8x8x4_t __rev1; \ 32282 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32283 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32284 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32285 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32286 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 4); \ 32287 }) 
32288 #endif 32289 32290 #ifdef __LITTLE_ENDIAN__ 32291 #define vst4_p16(__p0, __p1) __extension__ ({ \ 32292 poly16x4x4_t __s1 = __p1; \ 32293 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 5); \ 32294 }) 32295 #else 32296 #define vst4_p16(__p0, __p1) __extension__ ({ \ 32297 poly16x4x4_t __s1 = __p1; \ 32298 poly16x4x4_t __rev1; \ 32299 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32300 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32301 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32302 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32303 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 5); \ 32304 }) 32305 #endif 32306 32307 #ifdef __LITTLE_ENDIAN__ 32308 #define vst4q_p8(__p0, __p1) __extension__ ({ \ 32309 poly8x16x4_t __s1 = __p1; \ 32310 __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 36); \ 32311 }) 32312 #else 32313 #define vst4q_p8(__p0, __p1) __extension__ ({ \ 32314 poly8x16x4_t __s1 = __p1; \ 32315 poly8x16x4_t __rev1; \ 32316 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 32317 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 32318 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 32319 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 32320 __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 36); \ 32321 }) 32322 
#endif

/*
 * Shape shared by the vst4q_* macros below: the structure argument (__p1) is
 * copied into a local, its four member vectors are cast to int8x16_t, and
 * they are forwarded with the pointer argument (__p0) to
 * __builtin_neon_vst4q_v.  When __LITTLE_ENDIAN__ is not defined, the lanes
 * of every member vector are reversed with __builtin_shufflevector before the
 * builtin is called.
 * NOTE(review): the trailing integer constant is presumably the builtin's
 * element-type selector -- confirm against the compiler's NEON builtin tables.
 */

/* vst4q_p16: poly16x8x4_t operand, 8 lanes per vector, builtin constant 37. */
#ifdef __LITTLE_ENDIAN__
#define vst4q_p16(__p0, __p1) __extension__ ({ \
  poly16x8x4_t __s1 = __p1; \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 37); \
})
#else
#define vst4q_p16(__p0, __p1) __extension__ ({ \
  poly16x8x4_t __s1 = __p1; \
  __s1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 37); \
})
#endif

/* vst4q_u8: uint8x16x4_t operand, 16 lanes per vector, builtin constant 48. */
#ifdef __LITTLE_ENDIAN__
#define vst4q_u8(__p0, __p1) __extension__ ({ \
  uint8x16x4_t __s1 = __p1; \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 48); \
})
#else
#define vst4q_u8(__p0, __p1) __extension__ ({ \
  uint8x16x4_t __s1 = __p1; \
  __s1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 48); \
})
#endif

/* vst4q_u32: uint32x4x4_t operand, 4 lanes per vector, builtin constant 50. */
#ifdef __LITTLE_ENDIAN__
#define vst4q_u32(__p0, __p1) __extension__ ({ \
  uint32x4x4_t __s1 = __p1; \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 50); \
})
#else
#define vst4q_u32(__p0, __p1) __extension__ ({ \
  uint32x4x4_t __s1 = __p1; \
  __s1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  __s1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  __s1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  __s1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 50); \
})
#endif

/* vst4q_u16: uint16x8x4_t operand, 8 lanes per vector, builtin constant 49. */
#ifdef __LITTLE_ENDIAN__
#define vst4q_u16(__p0, __p1) __extension__ ({ \
  uint16x8x4_t __s1 = __p1; \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 49); \
})
#else
#define vst4q_u16(__p0, __p1) __extension__ ({ \
  uint16x8x4_t __s1 = __p1; \
  __s1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 49); \
})
#endif

/* vst4q_s8: int8x16x4_t operand, 16 lanes per vector, builtin constant 32. */
#ifdef __LITTLE_ENDIAN__
#define vst4q_s8(__p0, __p1) __extension__ ({ \
  int8x16x4_t __s1 = __p1; \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 32); \
})
#else
#define vst4q_s8(__p0, __p1) __extension__ ({ \
  int8x16x4_t __s1 = __p1; \
  __s1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __s1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 32); \
})
#endif

/* vst4q_f32: float32x4x4_t operand, 4 lanes per vector, builtin constant 41. */
#ifdef __LITTLE_ENDIAN__
#define vst4q_f32(__p0, __p1) __extension__ ({ \
  float32x4x4_t __s1 = __p1; \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 41); \
})
#else
#define vst4q_f32(__p0, __p1) __extension__ ({ \
  float32x4x4_t __s1 = __p1; \
  __s1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \
  __s1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \
  __s1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \
  __s1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \
  __builtin_neon_vst4q_v(__p0, \
      (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], \
      (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 41); \
})
#endif

#ifdef __LITTLE_ENDIAN__ 32427 #define vst4q_s32(__p0, __p1) __extension__ ({ \ 32428 int32x4x4_t __s1 = __p1; \ 32429 __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 34); \ 32430 }) 32431 #else 32432 #define vst4q_s32(__p0, __p1) __extension__ ({ \ 32433 int32x4x4_t __s1 = __p1; \ 32434 int32x4x4_t __rev1; \ 32435 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32436 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32437 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32438 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32439 __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 34); \ 32440 }) 32441 #endif 32442 32443 #ifdef __LITTLE_ENDIAN__ 32444 #define vst4q_s16(__p0, __p1) __extension__ ({ \ 32445 int16x8x4_t __s1 = __p1; \ 32446 __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 33); \ 32447 }) 32448 #else 32449 #define vst4q_s16(__p0, __p1) __extension__ ({ \ 32450 int16x8x4_t __s1 = __p1; \ 32451 int16x8x4_t __rev1; \ 32452 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32453 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32454 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32455 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32456 __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 33); \ 32457 }) 32458 #endif 32459 32460 #ifdef __LITTLE_ENDIAN__ 32461 #define vst4_u8(__p0, __p1) __extension__ ({ \ 32462 uint8x8x4_t __s1 = __p1; \ 32463 
__builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 16); \ 32464 }) 32465 #else 32466 #define vst4_u8(__p0, __p1) __extension__ ({ \ 32467 uint8x8x4_t __s1 = __p1; \ 32468 uint8x8x4_t __rev1; \ 32469 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32470 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32471 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32472 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32473 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 16); \ 32474 }) 32475 #endif 32476 32477 #ifdef __LITTLE_ENDIAN__ 32478 #define vst4_u32(__p0, __p1) __extension__ ({ \ 32479 uint32x2x4_t __s1 = __p1; \ 32480 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 18); \ 32481 }) 32482 #else 32483 #define vst4_u32(__p0, __p1) __extension__ ({ \ 32484 uint32x2x4_t __s1 = __p1; \ 32485 uint32x2x4_t __rev1; \ 32486 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32487 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32488 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32489 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 32490 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 18); \ 32491 }) 32492 #endif 32493 32494 #define vst4_u64(__p0, __p1) __extension__ ({ \ 32495 uint64x1x4_t __s1 = __p1; \ 32496 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 19); \ 32497 }) 32498 #ifdef __LITTLE_ENDIAN__ 32499 #define vst4_u16(__p0, 
__p1) __extension__ ({ \ 32500 uint16x4x4_t __s1 = __p1; \ 32501 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 17); \ 32502 }) 32503 #else 32504 #define vst4_u16(__p0, __p1) __extension__ ({ \ 32505 uint16x4x4_t __s1 = __p1; \ 32506 uint16x4x4_t __rev1; \ 32507 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32508 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32509 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32510 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32511 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 17); \ 32512 }) 32513 #endif 32514 32515 #ifdef __LITTLE_ENDIAN__ 32516 #define vst4_s8(__p0, __p1) __extension__ ({ \ 32517 int8x8x4_t __s1 = __p1; \ 32518 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 0); \ 32519 }) 32520 #else 32521 #define vst4_s8(__p0, __p1) __extension__ ({ \ 32522 int8x8x4_t __s1 = __p1; \ 32523 int8x8x4_t __rev1; \ 32524 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32525 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32526 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32527 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32528 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 0); \ 32529 }) 32530 #endif 32531 32532 #ifdef __LITTLE_ENDIAN__ 32533 #define vst4_f32(__p0, __p1) __extension__ ({ \ 32534 float32x2x4_t __s1 = __p1; \ 32535 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 
(int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 9); \ 32536 }) 32537 #else 32538 #define vst4_f32(__p0, __p1) __extension__ ({ \ 32539 float32x2x4_t __s1 = __p1; \ 32540 float32x2x4_t __rev1; \ 32541 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32542 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32543 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32544 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 32545 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 9); \ 32546 }) 32547 #endif 32548 32549 #ifdef __LITTLE_ENDIAN__ 32550 #define vst4_s32(__p0, __p1) __extension__ ({ \ 32551 int32x2x4_t __s1 = __p1; \ 32552 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 2); \ 32553 }) 32554 #else 32555 #define vst4_s32(__p0, __p1) __extension__ ({ \ 32556 int32x2x4_t __s1 = __p1; \ 32557 int32x2x4_t __rev1; \ 32558 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32559 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32560 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32561 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 32562 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 2); \ 32563 }) 32564 #endif 32565 32566 #define vst4_s64(__p0, __p1) __extension__ ({ \ 32567 int64x1x4_t __s1 = __p1; \ 32568 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 3); \ 32569 }) 32570 #ifdef __LITTLE_ENDIAN__ 32571 #define vst4_s16(__p0, __p1) __extension__ ({ \ 32572 int16x4x4_t __s1 = __p1; \ 32573 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 
(int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 1); \ 32574 }) 32575 #else 32576 #define vst4_s16(__p0, __p1) __extension__ ({ \ 32577 int16x4x4_t __s1 = __p1; \ 32578 int16x4x4_t __rev1; \ 32579 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32580 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32581 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32582 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32583 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 1); \ 32584 }) 32585 #endif 32586 32587 #ifdef __LITTLE_ENDIAN__ 32588 #define vst4_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 32589 poly8x8x4_t __s1 = __p1; \ 32590 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 4); \ 32591 }) 32592 #else 32593 #define vst4_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 32594 poly8x8x4_t __s1 = __p1; \ 32595 poly8x8x4_t __rev1; \ 32596 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32597 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32598 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32599 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32600 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 4); \ 32601 }) 32602 #endif 32603 32604 #ifdef __LITTLE_ENDIAN__ 32605 #define vst4_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 32606 poly16x4x4_t __s1 = __p1; \ 32607 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 5); \ 32608 }) 32609 #else 32610 
#define vst4_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 32611 poly16x4x4_t __s1 = __p1; \ 32612 poly16x4x4_t __rev1; \ 32613 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32614 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32615 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32616 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32617 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 5); \ 32618 }) 32619 #endif 32620 32621 #ifdef __LITTLE_ENDIAN__ 32622 #define vst4q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 32623 poly16x8x4_t __s1 = __p1; \ 32624 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 37); \ 32625 }) 32626 #else 32627 #define vst4q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 32628 poly16x8x4_t __s1 = __p1; \ 32629 poly16x8x4_t __rev1; \ 32630 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32631 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32632 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32633 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32634 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 37); \ 32635 }) 32636 #endif 32637 32638 #ifdef __LITTLE_ENDIAN__ 32639 #define vst4q_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 32640 uint32x4x4_t __s1 = __p1; \ 32641 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 50); \ 32642 }) 32643 #else 32644 #define vst4q_lane_u32(__p0, 
__p1, __p2) __extension__ ({ \ 32645 uint32x4x4_t __s1 = __p1; \ 32646 uint32x4x4_t __rev1; \ 32647 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32648 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32649 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32650 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32651 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 50); \ 32652 }) 32653 #endif 32654 32655 #ifdef __LITTLE_ENDIAN__ 32656 #define vst4q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 32657 uint16x8x4_t __s1 = __p1; \ 32658 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 49); \ 32659 }) 32660 #else 32661 #define vst4q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 32662 uint16x8x4_t __s1 = __p1; \ 32663 uint16x8x4_t __rev1; \ 32664 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32665 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32666 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32667 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32668 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 49); \ 32669 }) 32670 #endif 32671 32672 #ifdef __LITTLE_ENDIAN__ 32673 #define vst4q_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 32674 float32x4x4_t __s1 = __p1; \ 32675 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 41); \ 32676 }) 32677 #else 32678 #define vst4q_lane_f32(__p0, __p1, __p2) 
__extension__ ({ \ 32679 float32x4x4_t __s1 = __p1; \ 32680 float32x4x4_t __rev1; \ 32681 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32682 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32683 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32684 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32685 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 41); \ 32686 }) 32687 #endif 32688 32689 #ifdef __LITTLE_ENDIAN__ 32690 #define vst4q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 32691 int32x4x4_t __s1 = __p1; \ 32692 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 34); \ 32693 }) 32694 #else 32695 #define vst4q_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 32696 int32x4x4_t __s1 = __p1; \ 32697 int32x4x4_t __rev1; \ 32698 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32699 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32700 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32701 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32702 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 34); \ 32703 }) 32704 #endif 32705 32706 #ifdef __LITTLE_ENDIAN__ 32707 #define vst4q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 32708 int16x8x4_t __s1 = __p1; \ 32709 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 33); \ 32710 }) 32711 #else 32712 #define vst4q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 32713 int16x8x4_t __s1 = __p1; \ 32714 int16x8x4_t 
__rev1; \ 32715 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32716 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32717 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32718 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32719 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 33); \ 32720 }) 32721 #endif 32722 32723 #ifdef __LITTLE_ENDIAN__ 32724 #define vst4_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 32725 uint8x8x4_t __s1 = __p1; \ 32726 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 16); \ 32727 }) 32728 #else 32729 #define vst4_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 32730 uint8x8x4_t __s1 = __p1; \ 32731 uint8x8x4_t __rev1; \ 32732 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32733 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32734 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32735 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32736 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 16); \ 32737 }) 32738 #endif 32739 32740 #ifdef __LITTLE_ENDIAN__ 32741 #define vst4_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 32742 uint32x2x4_t __s1 = __p1; \ 32743 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 18); \ 32744 }) 32745 #else 32746 #define vst4_lane_u32(__p0, __p1, __p2) __extension__ ({ \ 32747 uint32x2x4_t __s1 = __p1; \ 32748 uint32x2x4_t 
__rev1; \ 32749 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32750 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32751 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32752 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 32753 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 18); \ 32754 }) 32755 #endif 32756 32757 #ifdef __LITTLE_ENDIAN__ 32758 #define vst4_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 32759 uint16x4x4_t __s1 = __p1; \ 32760 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 17); \ 32761 }) 32762 #else 32763 #define vst4_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 32764 uint16x4x4_t __s1 = __p1; \ 32765 uint16x4x4_t __rev1; \ 32766 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32767 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32768 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32769 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32770 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 17); \ 32771 }) 32772 #endif 32773 32774 #ifdef __LITTLE_ENDIAN__ 32775 #define vst4_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 32776 int8x8x4_t __s1 = __p1; \ 32777 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 0); \ 32778 }) 32779 #else 32780 #define vst4_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 32781 int8x8x4_t __s1 = __p1; \ 32782 int8x8x4_t __rev1; \ 32783 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 32784 __rev1.val[1] = 
__builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 32785 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 32786 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 32787 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 0); \ 32788 }) 32789 #endif 32790 32791 #ifdef __LITTLE_ENDIAN__ 32792 #define vst4_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 32793 float32x2x4_t __s1 = __p1; \ 32794 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 9); \ 32795 }) 32796 #else 32797 #define vst4_lane_f32(__p0, __p1, __p2) __extension__ ({ \ 32798 float32x2x4_t __s1 = __p1; \ 32799 float32x2x4_t __rev1; \ 32800 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32801 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32802 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32803 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 32804 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 9); \ 32805 }) 32806 #endif 32807 32808 #ifdef __LITTLE_ENDIAN__ 32809 #define vst4_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 32810 int32x2x4_t __s1 = __p1; \ 32811 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 2); \ 32812 }) 32813 #else 32814 #define vst4_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 32815 int32x2x4_t __s1 = __p1; \ 32816 int32x2x4_t __rev1; \ 32817 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 32818 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 32819 __rev1.val[2] = 
__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 32820 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 32821 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 2); \ 32822 }) 32823 #endif 32824 32825 #ifdef __LITTLE_ENDIAN__ 32826 #define vst4_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 32827 int16x4x4_t __s1 = __p1; \ 32828 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 1); \ 32829 }) 32830 #else 32831 #define vst4_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 32832 int16x4x4_t __s1 = __p1; \ 32833 int16x4x4_t __rev1; \ 32834 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 32835 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 32836 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 32837 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 32838 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 1); \ 32839 }) 32840 #endif 32841 32842 #ifdef __LITTLE_ENDIAN__ 32843 __ai __attribute__((target("neon"))) uint8x16_t vsubq_u8(uint8x16_t __p0, uint8x16_t __p1) { 32844 uint8x16_t __ret; 32845 __ret = __p0 - __p1; 32846 return __ret; 32847 } 32848 #else 32849 __ai __attribute__((target("neon"))) uint8x16_t vsubq_u8(uint8x16_t __p0, uint8x16_t __p1) { 32850 uint8x16_t __ret; 32851 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 32852 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 32853 __ret = __rev0 - __rev1; 32854 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 
32855 return __ret; 32856 } 32857 #endif 32858 32859 #ifdef __LITTLE_ENDIAN__ 32860 __ai __attribute__((target("neon"))) uint32x4_t vsubq_u32(uint32x4_t __p0, uint32x4_t __p1) { 32861 uint32x4_t __ret; 32862 __ret = __p0 - __p1; 32863 return __ret; 32864 } 32865 #else 32866 __ai __attribute__((target("neon"))) uint32x4_t vsubq_u32(uint32x4_t __p0, uint32x4_t __p1) { 32867 uint32x4_t __ret; 32868 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 32869 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 32870 __ret = __rev0 - __rev1; 32871 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 32872 return __ret; 32873 } 32874 #endif 32875 32876 #ifdef __LITTLE_ENDIAN__ 32877 __ai __attribute__((target("neon"))) uint64x2_t vsubq_u64(uint64x2_t __p0, uint64x2_t __p1) { 32878 uint64x2_t __ret; 32879 __ret = __p0 - __p1; 32880 return __ret; 32881 } 32882 #else 32883 __ai __attribute__((target("neon"))) uint64x2_t vsubq_u64(uint64x2_t __p0, uint64x2_t __p1) { 32884 uint64x2_t __ret; 32885 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 32886 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 32887 __ret = __rev0 - __rev1; 32888 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 32889 return __ret; 32890 } 32891 #endif 32892 32893 #ifdef __LITTLE_ENDIAN__ 32894 __ai __attribute__((target("neon"))) uint16x8_t vsubq_u16(uint16x8_t __p0, uint16x8_t __p1) { 32895 uint16x8_t __ret; 32896 __ret = __p0 - __p1; 32897 return __ret; 32898 } 32899 #else 32900 __ai __attribute__((target("neon"))) uint16x8_t vsubq_u16(uint16x8_t __p0, uint16x8_t __p1) { 32901 uint16x8_t __ret; 32902 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 32903 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 32904 __ret = __rev0 - __rev1; 32905 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 32906 return 
__ret; 32907 } 32908 #endif 32909 32910 #ifdef __LITTLE_ENDIAN__ 32911 __ai __attribute__((target("neon"))) int8x16_t vsubq_s8(int8x16_t __p0, int8x16_t __p1) { 32912 int8x16_t __ret; 32913 __ret = __p0 - __p1; 32914 return __ret; 32915 } 32916 #else 32917 __ai __attribute__((target("neon"))) int8x16_t vsubq_s8(int8x16_t __p0, int8x16_t __p1) { 32918 int8x16_t __ret; 32919 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 32920 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 32921 __ret = __rev0 - __rev1; 32922 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 32923 return __ret; 32924 } 32925 #endif 32926 32927 #ifdef __LITTLE_ENDIAN__ 32928 __ai __attribute__((target("neon"))) float32x4_t vsubq_f32(float32x4_t __p0, float32x4_t __p1) { 32929 float32x4_t __ret; 32930 __ret = __p0 - __p1; 32931 return __ret; 32932 } 32933 #else 32934 __ai __attribute__((target("neon"))) float32x4_t vsubq_f32(float32x4_t __p0, float32x4_t __p1) { 32935 float32x4_t __ret; 32936 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 32937 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 32938 __ret = __rev0 - __rev1; 32939 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 32940 return __ret; 32941 } 32942 #endif 32943 32944 #ifdef __LITTLE_ENDIAN__ 32945 __ai __attribute__((target("neon"))) int32x4_t vsubq_s32(int32x4_t __p0, int32x4_t __p1) { 32946 int32x4_t __ret; 32947 __ret = __p0 - __p1; 32948 return __ret; 32949 } 32950 #else 32951 __ai __attribute__((target("neon"))) int32x4_t vsubq_s32(int32x4_t __p0, int32x4_t __p1) { 32952 int32x4_t __ret; 32953 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 32954 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 32955 __ret = __rev0 - 
__rev1; 32956 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 32957 return __ret; 32958 } 32959 #endif 32960 32961 #ifdef __LITTLE_ENDIAN__ 32962 __ai __attribute__((target("neon"))) int64x2_t vsubq_s64(int64x2_t __p0, int64x2_t __p1) { 32963 int64x2_t __ret; 32964 __ret = __p0 - __p1; 32965 return __ret; 32966 } 32967 #else 32968 __ai __attribute__((target("neon"))) int64x2_t vsubq_s64(int64x2_t __p0, int64x2_t __p1) { 32969 int64x2_t __ret; 32970 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 32971 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 32972 __ret = __rev0 - __rev1; 32973 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 32974 return __ret; 32975 } 32976 #endif 32977 32978 #ifdef __LITTLE_ENDIAN__ 32979 __ai __attribute__((target("neon"))) int16x8_t vsubq_s16(int16x8_t __p0, int16x8_t __p1) { 32980 int16x8_t __ret; 32981 __ret = __p0 - __p1; 32982 return __ret; 32983 } 32984 #else 32985 __ai __attribute__((target("neon"))) int16x8_t vsubq_s16(int16x8_t __p0, int16x8_t __p1) { 32986 int16x8_t __ret; 32987 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 32988 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 32989 __ret = __rev0 - __rev1; 32990 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 32991 return __ret; 32992 } 32993 #endif 32994 32995 #ifdef __LITTLE_ENDIAN__ 32996 __ai __attribute__((target("neon"))) uint8x8_t vsub_u8(uint8x8_t __p0, uint8x8_t __p1) { 32997 uint8x8_t __ret; 32998 __ret = __p0 - __p1; 32999 return __ret; 33000 } 33001 #else 33002 __ai __attribute__((target("neon"))) uint8x8_t vsub_u8(uint8x8_t __p0, uint8x8_t __p1) { 33003 uint8x8_t __ret; 33004 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33005 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33006 __ret = __rev0 - __rev1; 33007 __ret = 
__builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33008 return __ret; 33009 } 33010 #endif 33011 33012 #ifdef __LITTLE_ENDIAN__ 33013 __ai __attribute__((target("neon"))) uint32x2_t vsub_u32(uint32x2_t __p0, uint32x2_t __p1) { 33014 uint32x2_t __ret; 33015 __ret = __p0 - __p1; 33016 return __ret; 33017 } 33018 #else 33019 __ai __attribute__((target("neon"))) uint32x2_t vsub_u32(uint32x2_t __p0, uint32x2_t __p1) { 33020 uint32x2_t __ret; 33021 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 33022 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33023 __ret = __rev0 - __rev1; 33024 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33025 return __ret; 33026 } 33027 #endif 33028 33029 __ai __attribute__((target("neon"))) uint64x1_t vsub_u64(uint64x1_t __p0, uint64x1_t __p1) { 33030 uint64x1_t __ret; 33031 __ret = __p0 - __p1; 33032 return __ret; 33033 } 33034 #ifdef __LITTLE_ENDIAN__ 33035 __ai __attribute__((target("neon"))) uint16x4_t vsub_u16(uint16x4_t __p0, uint16x4_t __p1) { 33036 uint16x4_t __ret; 33037 __ret = __p0 - __p1; 33038 return __ret; 33039 } 33040 #else 33041 __ai __attribute__((target("neon"))) uint16x4_t vsub_u16(uint16x4_t __p0, uint16x4_t __p1) { 33042 uint16x4_t __ret; 33043 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33044 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33045 __ret = __rev0 - __rev1; 33046 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 33047 return __ret; 33048 } 33049 #endif 33050 33051 #ifdef __LITTLE_ENDIAN__ 33052 __ai __attribute__((target("neon"))) int8x8_t vsub_s8(int8x8_t __p0, int8x8_t __p1) { 33053 int8x8_t __ret; 33054 __ret = __p0 - __p1; 33055 return __ret; 33056 } 33057 #else 33058 __ai __attribute__((target("neon"))) int8x8_t vsub_s8(int8x8_t __p0, int8x8_t __p1) { 33059 int8x8_t __ret; 33060 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 
33061 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33062 __ret = __rev0 - __rev1; 33063 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33064 return __ret; 33065 } 33066 #endif 33067 33068 #ifdef __LITTLE_ENDIAN__ 33069 __ai __attribute__((target("neon"))) float32x2_t vsub_f32(float32x2_t __p0, float32x2_t __p1) { 33070 float32x2_t __ret; 33071 __ret = __p0 - __p1; 33072 return __ret; 33073 } 33074 #else 33075 __ai __attribute__((target("neon"))) float32x2_t vsub_f32(float32x2_t __p0, float32x2_t __p1) { 33076 float32x2_t __ret; 33077 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 33078 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33079 __ret = __rev0 - __rev1; 33080 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33081 return __ret; 33082 } 33083 #endif 33084 33085 #ifdef __LITTLE_ENDIAN__ 33086 __ai __attribute__((target("neon"))) int32x2_t vsub_s32(int32x2_t __p0, int32x2_t __p1) { 33087 int32x2_t __ret; 33088 __ret = __p0 - __p1; 33089 return __ret; 33090 } 33091 #else 33092 __ai __attribute__((target("neon"))) int32x2_t vsub_s32(int32x2_t __p0, int32x2_t __p1) { 33093 int32x2_t __ret; 33094 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 33095 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33096 __ret = __rev0 - __rev1; 33097 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33098 return __ret; 33099 } 33100 #endif 33101 33102 __ai __attribute__((target("neon"))) int64x1_t vsub_s64(int64x1_t __p0, int64x1_t __p1) { 33103 int64x1_t __ret; 33104 __ret = __p0 - __p1; 33105 return __ret; 33106 } 33107 #ifdef __LITTLE_ENDIAN__ 33108 __ai __attribute__((target("neon"))) int16x4_t vsub_s16(int16x4_t __p0, int16x4_t __p1) { 33109 int16x4_t __ret; 33110 __ret = __p0 - __p1; 33111 return __ret; 33112 } 33113 #else 33114 __ai __attribute__((target("neon"))) int16x4_t vsub_s16(int16x4_t __p0, int16x4_t 
__p1) { 33115 int16x4_t __ret; 33116 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33117 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33118 __ret = __rev0 - __rev1; 33119 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 33120 return __ret; 33121 } 33122 #endif 33123 33124 #ifdef __LITTLE_ENDIAN__ 33125 __ai __attribute__((target("neon"))) uint16x4_t vsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 33126 uint16x4_t __ret; 33127 __ret = (uint16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17); 33128 return __ret; 33129 } 33130 #else 33131 __ai __attribute__((target("neon"))) uint16x4_t vsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 33132 uint16x4_t __ret; 33133 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33134 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33135 __ret = (uint16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 17); 33136 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 33137 return __ret; 33138 } 33139 __ai __attribute__((target("neon"))) uint16x4_t __noswap_vsubhn_u32(uint32x4_t __p0, uint32x4_t __p1) { 33140 uint16x4_t __ret; 33141 __ret = (uint16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 17); 33142 return __ret; 33143 } 33144 #endif 33145 33146 #ifdef __LITTLE_ENDIAN__ 33147 __ai __attribute__((target("neon"))) uint32x2_t vsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 33148 uint32x2_t __ret; 33149 __ret = (uint32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18); 33150 return __ret; 33151 } 33152 #else 33153 __ai __attribute__((target("neon"))) uint32x2_t vsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 33154 uint32x2_t __ret; 33155 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 33156 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33157 __ret = (uint32x2_t) 
__builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 18); 33158 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33159 return __ret; 33160 } 33161 __ai __attribute__((target("neon"))) uint32x2_t __noswap_vsubhn_u64(uint64x2_t __p0, uint64x2_t __p1) { 33162 uint32x2_t __ret; 33163 __ret = (uint32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 18); 33164 return __ret; 33165 } 33166 #endif 33167 33168 #ifdef __LITTLE_ENDIAN__ 33169 __ai __attribute__((target("neon"))) uint8x8_t vsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 33170 uint8x8_t __ret; 33171 __ret = (uint8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16); 33172 return __ret; 33173 } 33174 #else 33175 __ai __attribute__((target("neon"))) uint8x8_t vsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 33176 uint8x8_t __ret; 33177 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33178 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33179 __ret = (uint8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 16); 33180 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33181 return __ret; 33182 } 33183 __ai __attribute__((target("neon"))) uint8x8_t __noswap_vsubhn_u16(uint16x8_t __p0, uint16x8_t __p1) { 33184 uint8x8_t __ret; 33185 __ret = (uint8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 16); 33186 return __ret; 33187 } 33188 #endif 33189 33190 #ifdef __LITTLE_ENDIAN__ 33191 __ai __attribute__((target("neon"))) int16x4_t vsubhn_s32(int32x4_t __p0, int32x4_t __p1) { 33192 int16x4_t __ret; 33193 __ret = (int16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1); 33194 return __ret; 33195 } 33196 #else 33197 __ai __attribute__((target("neon"))) int16x4_t vsubhn_s32(int32x4_t __p0, int32x4_t __p1) { 33198 int16x4_t __ret; 33199 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33200 int32x4_t __rev1; 
__rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33201 __ret = (int16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 1); 33202 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 33203 return __ret; 33204 } 33205 __ai __attribute__((target("neon"))) int16x4_t __noswap_vsubhn_s32(int32x4_t __p0, int32x4_t __p1) { 33206 int16x4_t __ret; 33207 __ret = (int16x4_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 1); 33208 return __ret; 33209 } 33210 #endif 33211 33212 #ifdef __LITTLE_ENDIAN__ 33213 __ai __attribute__((target("neon"))) int32x2_t vsubhn_s64(int64x2_t __p0, int64x2_t __p1) { 33214 int32x2_t __ret; 33215 __ret = (int32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2); 33216 return __ret; 33217 } 33218 #else 33219 __ai __attribute__((target("neon"))) int32x2_t vsubhn_s64(int64x2_t __p0, int64x2_t __p1) { 33220 int32x2_t __ret; 33221 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 33222 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33223 __ret = (int32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 2); 33224 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33225 return __ret; 33226 } 33227 __ai __attribute__((target("neon"))) int32x2_t __noswap_vsubhn_s64(int64x2_t __p0, int64x2_t __p1) { 33228 int32x2_t __ret; 33229 __ret = (int32x2_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 2); 33230 return __ret; 33231 } 33232 #endif 33233 33234 #ifdef __LITTLE_ENDIAN__ 33235 __ai __attribute__((target("neon"))) int8x8_t vsubhn_s16(int16x8_t __p0, int16x8_t __p1) { 33236 int8x8_t __ret; 33237 __ret = (int8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0); 33238 return __ret; 33239 } 33240 #else 33241 __ai __attribute__((target("neon"))) int8x8_t vsubhn_s16(int16x8_t __p0, int16x8_t __p1) { 33242 int8x8_t __ret; 33243 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 
33244 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33245 __ret = (int8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__rev0, (int8x16_t)__rev1, 0); 33246 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33247 return __ret; 33248 } 33249 __ai __attribute__((target("neon"))) int8x8_t __noswap_vsubhn_s16(int16x8_t __p0, int16x8_t __p1) { 33250 int8x8_t __ret; 33251 __ret = (int8x8_t) __builtin_neon_vsubhn_v((int8x16_t)__p0, (int8x16_t)__p1, 0); 33252 return __ret; 33253 } 33254 #endif 33255 33256 #ifdef __LITTLE_ENDIAN__ 33257 __ai __attribute__((target("neon"))) uint16x8_t vsubl_u8(uint8x8_t __p0, uint8x8_t __p1) { 33258 uint16x8_t __ret; 33259 __ret = vmovl_u8(__p0) - vmovl_u8(__p1); 33260 return __ret; 33261 } 33262 #else 33263 __ai __attribute__((target("neon"))) uint16x8_t vsubl_u8(uint8x8_t __p0, uint8x8_t __p1) { 33264 uint16x8_t __ret; 33265 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33266 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33267 __ret = __noswap_vmovl_u8(__rev0) - __noswap_vmovl_u8(__rev1); 33268 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33269 return __ret; 33270 } 33271 #endif 33272 33273 #ifdef __LITTLE_ENDIAN__ 33274 __ai __attribute__((target("neon"))) uint64x2_t vsubl_u32(uint32x2_t __p0, uint32x2_t __p1) { 33275 uint64x2_t __ret; 33276 __ret = vmovl_u32(__p0) - vmovl_u32(__p1); 33277 return __ret; 33278 } 33279 #else 33280 __ai __attribute__((target("neon"))) uint64x2_t vsubl_u32(uint32x2_t __p0, uint32x2_t __p1) { 33281 uint64x2_t __ret; 33282 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 33283 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33284 __ret = __noswap_vmovl_u32(__rev0) - __noswap_vmovl_u32(__rev1); 33285 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33286 return __ret; 33287 } 33288 #endif 33289 33290 
#ifdef __LITTLE_ENDIAN__ 33291 __ai __attribute__((target("neon"))) uint32x4_t vsubl_u16(uint16x4_t __p0, uint16x4_t __p1) { 33292 uint32x4_t __ret; 33293 __ret = vmovl_u16(__p0) - vmovl_u16(__p1); 33294 return __ret; 33295 } 33296 #else 33297 __ai __attribute__((target("neon"))) uint32x4_t vsubl_u16(uint16x4_t __p0, uint16x4_t __p1) { 33298 uint32x4_t __ret; 33299 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33300 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33301 __ret = __noswap_vmovl_u16(__rev0) - __noswap_vmovl_u16(__rev1); 33302 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 33303 return __ret; 33304 } 33305 #endif 33306 33307 #ifdef __LITTLE_ENDIAN__ 33308 __ai __attribute__((target("neon"))) int16x8_t vsubl_s8(int8x8_t __p0, int8x8_t __p1) { 33309 int16x8_t __ret; 33310 __ret = vmovl_s8(__p0) - vmovl_s8(__p1); 33311 return __ret; 33312 } 33313 #else 33314 __ai __attribute__((target("neon"))) int16x8_t vsubl_s8(int8x8_t __p0, int8x8_t __p1) { 33315 int16x8_t __ret; 33316 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33317 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33318 __ret = __noswap_vmovl_s8(__rev0) - __noswap_vmovl_s8(__rev1); 33319 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33320 return __ret; 33321 } 33322 #endif 33323 33324 #ifdef __LITTLE_ENDIAN__ 33325 __ai __attribute__((target("neon"))) int64x2_t vsubl_s32(int32x2_t __p0, int32x2_t __p1) { 33326 int64x2_t __ret; 33327 __ret = vmovl_s32(__p0) - vmovl_s32(__p1); 33328 return __ret; 33329 } 33330 #else 33331 __ai __attribute__((target("neon"))) int64x2_t vsubl_s32(int32x2_t __p0, int32x2_t __p1) { 33332 int64x2_t __ret; 33333 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 33334 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33335 __ret = __noswap_vmovl_s32(__rev0) - 
__noswap_vmovl_s32(__rev1); 33336 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33337 return __ret; 33338 } 33339 #endif 33340 33341 #ifdef __LITTLE_ENDIAN__ 33342 __ai __attribute__((target("neon"))) int32x4_t vsubl_s16(int16x4_t __p0, int16x4_t __p1) { 33343 int32x4_t __ret; 33344 __ret = vmovl_s16(__p0) - vmovl_s16(__p1); 33345 return __ret; 33346 } 33347 #else 33348 __ai __attribute__((target("neon"))) int32x4_t vsubl_s16(int16x4_t __p0, int16x4_t __p1) { 33349 int32x4_t __ret; 33350 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33351 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33352 __ret = __noswap_vmovl_s16(__rev0) - __noswap_vmovl_s16(__rev1); 33353 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 33354 return __ret; 33355 } 33356 #endif 33357 33358 #ifdef __LITTLE_ENDIAN__ 33359 __ai __attribute__((target("neon"))) uint16x8_t vsubw_u8(uint16x8_t __p0, uint8x8_t __p1) { 33360 uint16x8_t __ret; 33361 __ret = __p0 - vmovl_u8(__p1); 33362 return __ret; 33363 } 33364 #else 33365 __ai __attribute__((target("neon"))) uint16x8_t vsubw_u8(uint16x8_t __p0, uint8x8_t __p1) { 33366 uint16x8_t __ret; 33367 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33368 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33369 __ret = __rev0 - __noswap_vmovl_u8(__rev1); 33370 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33371 return __ret; 33372 } 33373 #endif 33374 33375 #ifdef __LITTLE_ENDIAN__ 33376 __ai __attribute__((target("neon"))) uint64x2_t vsubw_u32(uint64x2_t __p0, uint32x2_t __p1) { 33377 uint64x2_t __ret; 33378 __ret = __p0 - vmovl_u32(__p1); 33379 return __ret; 33380 } 33381 #else 33382 __ai __attribute__((target("neon"))) uint64x2_t vsubw_u32(uint64x2_t __p0, uint32x2_t __p1) { 33383 uint64x2_t __ret; 33384 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 33385 
uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33386 __ret = __rev0 - __noswap_vmovl_u32(__rev1); 33387 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33388 return __ret; 33389 } 33390 #endif 33391 33392 #ifdef __LITTLE_ENDIAN__ 33393 __ai __attribute__((target("neon"))) uint32x4_t vsubw_u16(uint32x4_t __p0, uint16x4_t __p1) { 33394 uint32x4_t __ret; 33395 __ret = __p0 - vmovl_u16(__p1); 33396 return __ret; 33397 } 33398 #else 33399 __ai __attribute__((target("neon"))) uint32x4_t vsubw_u16(uint32x4_t __p0, uint16x4_t __p1) { 33400 uint32x4_t __ret; 33401 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33402 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33403 __ret = __rev0 - __noswap_vmovl_u16(__rev1); 33404 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 33405 return __ret; 33406 } 33407 #endif 33408 33409 #ifdef __LITTLE_ENDIAN__ 33410 __ai __attribute__((target("neon"))) int16x8_t vsubw_s8(int16x8_t __p0, int8x8_t __p1) { 33411 int16x8_t __ret; 33412 __ret = __p0 - vmovl_s8(__p1); 33413 return __ret; 33414 } 33415 #else 33416 __ai __attribute__((target("neon"))) int16x8_t vsubw_s8(int16x8_t __p0, int8x8_t __p1) { 33417 int16x8_t __ret; 33418 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33419 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33420 __ret = __rev0 - __noswap_vmovl_s8(__rev1); 33421 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33422 return __ret; 33423 } 33424 #endif 33425 33426 #ifdef __LITTLE_ENDIAN__ 33427 __ai __attribute__((target("neon"))) int64x2_t vsubw_s32(int64x2_t __p0, int32x2_t __p1) { 33428 int64x2_t __ret; 33429 __ret = __p0 - vmovl_s32(__p1); 33430 return __ret; 33431 } 33432 #else 33433 __ai __attribute__((target("neon"))) int64x2_t vsubw_s32(int64x2_t __p0, int32x2_t __p1) { 33434 int64x2_t __ret; 33435 int64x2_t __rev0; __rev0 
= __builtin_shufflevector(__p0, __p0, 1, 0); 33436 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 33437 __ret = __rev0 - __noswap_vmovl_s32(__rev1); 33438 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 33439 return __ret; 33440 } 33441 #endif 33442 33443 #ifdef __LITTLE_ENDIAN__ 33444 __ai __attribute__((target("neon"))) int32x4_t vsubw_s16(int32x4_t __p0, int16x4_t __p1) { 33445 int32x4_t __ret; 33446 __ret = __p0 - vmovl_s16(__p1); 33447 return __ret; 33448 } 33449 #else 33450 __ai __attribute__((target("neon"))) int32x4_t vsubw_s16(int32x4_t __p0, int16x4_t __p1) { 33451 int32x4_t __ret; 33452 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33453 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33454 __ret = __rev0 - __noswap_vmovl_s16(__rev1); 33455 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 33456 return __ret; 33457 } 33458 #endif 33459 33460 #ifdef __LITTLE_ENDIAN__ 33461 __ai __attribute__((target("neon"))) poly8x8_t vtbl1_p8(poly8x8_t __p0, uint8x8_t __p1) { 33462 poly8x8_t __ret; 33463 __ret = (poly8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__p0, (int8x8_t)__p1, 4); 33464 return __ret; 33465 } 33466 #else 33467 __ai __attribute__((target("neon"))) poly8x8_t vtbl1_p8(poly8x8_t __p0, uint8x8_t __p1) { 33468 poly8x8_t __ret; 33469 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33470 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33471 __ret = (poly8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__rev0, (int8x8_t)__rev1, 4); 33472 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33473 return __ret; 33474 } 33475 #endif 33476 33477 #ifdef __LITTLE_ENDIAN__ 33478 __ai __attribute__((target("neon"))) uint8x8_t vtbl1_u8(uint8x8_t __p0, uint8x8_t __p1) { 33479 uint8x8_t __ret; 33480 __ret = (uint8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 33481 return 
__ret; 33482 } 33483 #else 33484 __ai __attribute__((target("neon"))) uint8x8_t vtbl1_u8(uint8x8_t __p0, uint8x8_t __p1) { 33485 uint8x8_t __ret; 33486 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33487 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33488 __ret = (uint8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 33489 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33490 return __ret; 33491 } 33492 #endif 33493 33494 #ifdef __LITTLE_ENDIAN__ 33495 __ai __attribute__((target("neon"))) int8x8_t vtbl1_s8(int8x8_t __p0, int8x8_t __p1) { 33496 int8x8_t __ret; 33497 __ret = (int8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 33498 return __ret; 33499 } 33500 #else 33501 __ai __attribute__((target("neon"))) int8x8_t vtbl1_s8(int8x8_t __p0, int8x8_t __p1) { 33502 int8x8_t __ret; 33503 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33504 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33505 __ret = (int8x8_t) __builtin_neon_vtbl1_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 33506 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33507 return __ret; 33508 } 33509 #endif 33510 33511 #ifdef __LITTLE_ENDIAN__ 33512 __ai __attribute__((target("neon"))) poly8x8_t vtbl2_p8(poly8x8x2_t __p0, uint8x8_t __p1) { 33513 poly8x8_t __ret; 33514 __ret = (poly8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p1, 4); 33515 return __ret; 33516 } 33517 #else 33518 __ai __attribute__((target("neon"))) poly8x8_t vtbl2_p8(poly8x8x2_t __p0, uint8x8_t __p1) { 33519 poly8x8_t __ret; 33520 poly8x8x2_t __rev0; 33521 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33522 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33523 uint8x8_t 
__rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33524 __ret = (poly8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev1, 4); 33525 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33526 return __ret; 33527 } 33528 #endif 33529 33530 #ifdef __LITTLE_ENDIAN__ 33531 __ai __attribute__((target("neon"))) uint8x8_t vtbl2_u8(uint8x8x2_t __p0, uint8x8_t __p1) { 33532 uint8x8_t __ret; 33533 __ret = (uint8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p1, 16); 33534 return __ret; 33535 } 33536 #else 33537 __ai __attribute__((target("neon"))) uint8x8_t vtbl2_u8(uint8x8x2_t __p0, uint8x8_t __p1) { 33538 uint8x8_t __ret; 33539 uint8x8x2_t __rev0; 33540 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33541 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33542 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33543 __ret = (uint8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev1, 16); 33544 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33545 return __ret; 33546 } 33547 #endif 33548 33549 #ifdef __LITTLE_ENDIAN__ 33550 __ai __attribute__((target("neon"))) int8x8_t vtbl2_s8(int8x8x2_t __p0, int8x8_t __p1) { 33551 int8x8_t __ret; 33552 __ret = (int8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p1, 0); 33553 return __ret; 33554 } 33555 #else 33556 __ai __attribute__((target("neon"))) int8x8_t vtbl2_s8(int8x8x2_t __p0, int8x8_t __p1) { 33557 int8x8_t __ret; 33558 int8x8x2_t __rev0; 33559 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33560 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33561 int8x8_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33562 __ret = (int8x8_t) __builtin_neon_vtbl2_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev1, 0); 33563 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33564 return __ret; 33565 } 33566 #endif 33567 33568 #ifdef __LITTLE_ENDIAN__ 33569 __ai __attribute__((target("neon"))) poly8x8_t vtbl3_p8(poly8x8x3_t __p0, uint8x8_t __p1) { 33570 poly8x8_t __ret; 33571 __ret = (poly8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p1, 4); 33572 return __ret; 33573 } 33574 #else 33575 __ai __attribute__((target("neon"))) poly8x8_t vtbl3_p8(poly8x8x3_t __p0, uint8x8_t __p1) { 33576 poly8x8_t __ret; 33577 poly8x8x3_t __rev0; 33578 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33579 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33580 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33581 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33582 __ret = (poly8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev1, 4); 33583 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33584 return __ret; 33585 } 33586 #endif 33587 33588 #ifdef __LITTLE_ENDIAN__ 33589 __ai __attribute__((target("neon"))) uint8x8_t vtbl3_u8(uint8x8x3_t __p0, uint8x8_t __p1) { 33590 uint8x8_t __ret; 33591 __ret = (uint8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p1, 16); 33592 return __ret; 33593 } 33594 #else 33595 __ai __attribute__((target("neon"))) uint8x8_t vtbl3_u8(uint8x8x3_t __p0, uint8x8_t __p1) { 33596 uint8x8_t __ret; 33597 uint8x8x3_t __rev0; 33598 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 
3, 2, 1, 0); 33599 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33600 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33601 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33602 __ret = (uint8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev1, 16); 33603 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33604 return __ret; 33605 } 33606 #endif 33607 33608 #ifdef __LITTLE_ENDIAN__ 33609 __ai __attribute__((target("neon"))) int8x8_t vtbl3_s8(int8x8x3_t __p0, int8x8_t __p1) { 33610 int8x8_t __ret; 33611 __ret = (int8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p1, 0); 33612 return __ret; 33613 } 33614 #else 33615 __ai __attribute__((target("neon"))) int8x8_t vtbl3_s8(int8x8x3_t __p0, int8x8_t __p1) { 33616 int8x8_t __ret; 33617 int8x8x3_t __rev0; 33618 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33619 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33620 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33621 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33622 __ret = (int8x8_t) __builtin_neon_vtbl3_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev1, 0); 33623 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33624 return __ret; 33625 } 33626 #endif 33627 33628 #ifdef __LITTLE_ENDIAN__ 33629 __ai __attribute__((target("neon"))) poly8x8_t vtbl4_p8(poly8x8x4_t __p0, uint8x8_t __p1) { 33630 poly8x8_t __ret; 33631 __ret = (poly8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p0.val[3], 
(int8x8_t)__p1, 4); 33632 return __ret; 33633 } 33634 #else 33635 __ai __attribute__((target("neon"))) poly8x8_t vtbl4_p8(poly8x8x4_t __p0, uint8x8_t __p1) { 33636 poly8x8_t __ret; 33637 poly8x8x4_t __rev0; 33638 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33639 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33640 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33641 __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 7, 6, 5, 4, 3, 2, 1, 0); 33642 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33643 __ret = (poly8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev0.val[3], (int8x8_t)__rev1, 4); 33644 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33645 return __ret; 33646 } 33647 #endif 33648 33649 #ifdef __LITTLE_ENDIAN__ 33650 __ai __attribute__((target("neon"))) uint8x8_t vtbl4_u8(uint8x8x4_t __p0, uint8x8_t __p1) { 33651 uint8x8_t __ret; 33652 __ret = (uint8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p0.val[3], (int8x8_t)__p1, 16); 33653 return __ret; 33654 } 33655 #else 33656 __ai __attribute__((target("neon"))) uint8x8_t vtbl4_u8(uint8x8x4_t __p0, uint8x8_t __p1) { 33657 uint8x8_t __ret; 33658 uint8x8x4_t __rev0; 33659 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33660 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33661 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33662 __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 7, 6, 5, 4, 3, 2, 1, 0); 33663 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33664 __ret = (uint8x8_t) 
__builtin_neon_vtbl4_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev0.val[3], (int8x8_t)__rev1, 16); 33665 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33666 return __ret; 33667 } 33668 #endif 33669 33670 #ifdef __LITTLE_ENDIAN__ 33671 __ai __attribute__((target("neon"))) int8x8_t vtbl4_s8(int8x8x4_t __p0, int8x8_t __p1) { 33672 int8x8_t __ret; 33673 __ret = (int8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__p0.val[0], (int8x8_t)__p0.val[1], (int8x8_t)__p0.val[2], (int8x8_t)__p0.val[3], (int8x8_t)__p1, 0); 33674 return __ret; 33675 } 33676 #else 33677 __ai __attribute__((target("neon"))) int8x8_t vtbl4_s8(int8x8x4_t __p0, int8x8_t __p1) { 33678 int8x8_t __ret; 33679 int8x8x4_t __rev0; 33680 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33681 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33682 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33683 __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 7, 6, 5, 4, 3, 2, 1, 0); 33684 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33685 __ret = (int8x8_t) __builtin_neon_vtbl4_v((int8x8_t)__rev0.val[0], (int8x8_t)__rev0.val[1], (int8x8_t)__rev0.val[2], (int8x8_t)__rev0.val[3], (int8x8_t)__rev1, 0); 33686 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33687 return __ret; 33688 } 33689 #endif 33690 33691 #ifdef __LITTLE_ENDIAN__ 33692 __ai __attribute__((target("neon"))) poly8x8_t vtbx1_p8(poly8x8_t __p0, poly8x8_t __p1, uint8x8_t __p2) { 33693 poly8x8_t __ret; 33694 __ret = (poly8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 4); 33695 return __ret; 33696 } 33697 #else 33698 __ai __attribute__((target("neon"))) poly8x8_t vtbx1_p8(poly8x8_t __p0, poly8x8_t __p1, uint8x8_t __p2) { 33699 poly8x8_t __ret; 33700 poly8x8_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33701 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33702 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33703 __ret = (poly8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 4); 33704 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33705 return __ret; 33706 } 33707 #endif 33708 33709 #ifdef __LITTLE_ENDIAN__ 33710 __ai __attribute__((target("neon"))) uint8x8_t vtbx1_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 33711 uint8x8_t __ret; 33712 __ret = (uint8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 16); 33713 return __ret; 33714 } 33715 #else 33716 __ai __attribute__((target("neon"))) uint8x8_t vtbx1_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 33717 uint8x8_t __ret; 33718 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33719 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33720 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33721 __ret = (uint8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 16); 33722 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33723 return __ret; 33724 } 33725 #endif 33726 33727 #ifdef __LITTLE_ENDIAN__ 33728 __ai __attribute__((target("neon"))) int8x8_t vtbx1_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 33729 int8x8_t __ret; 33730 __ret = (int8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 0); 33731 return __ret; 33732 } 33733 #else 33734 __ai __attribute__((target("neon"))) int8x8_t vtbx1_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 33735 int8x8_t __ret; 33736 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33737 int8x8_t 
__rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33738 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33739 __ret = (int8x8_t) __builtin_neon_vtbx1_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 0); 33740 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33741 return __ret; 33742 } 33743 #endif 33744 33745 #ifdef __LITTLE_ENDIAN__ 33746 __ai __attribute__((target("neon"))) poly8x8_t vtbx2_p8(poly8x8_t __p0, poly8x8x2_t __p1, uint8x8_t __p2) { 33747 poly8x8_t __ret; 33748 __ret = (poly8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p2, 4); 33749 return __ret; 33750 } 33751 #else 33752 __ai __attribute__((target("neon"))) poly8x8_t vtbx2_p8(poly8x8_t __p0, poly8x8x2_t __p1, uint8x8_t __p2) { 33753 poly8x8_t __ret; 33754 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33755 poly8x8x2_t __rev1; 33756 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33757 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33758 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33759 __ret = (poly8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev2, 4); 33760 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33761 return __ret; 33762 } 33763 #endif 33764 33765 #ifdef __LITTLE_ENDIAN__ 33766 __ai __attribute__((target("neon"))) uint8x8_t vtbx2_u8(uint8x8_t __p0, uint8x8x2_t __p1, uint8x8_t __p2) { 33767 uint8x8_t __ret; 33768 __ret = (uint8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p2, 16); 33769 return __ret; 33770 } 33771 #else 33772 __ai __attribute__((target("neon"))) uint8x8_t vtbx2_u8(uint8x8_t __p0, uint8x8x2_t __p1, uint8x8_t __p2) 
{ 33773 uint8x8_t __ret; 33774 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33775 uint8x8x2_t __rev1; 33776 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33777 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33778 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33779 __ret = (uint8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev2, 16); 33780 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33781 return __ret; 33782 } 33783 #endif 33784 33785 #ifdef __LITTLE_ENDIAN__ 33786 __ai __attribute__((target("neon"))) int8x8_t vtbx2_s8(int8x8_t __p0, int8x8x2_t __p1, int8x8_t __p2) { 33787 int8x8_t __ret; 33788 __ret = (int8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p2, 0); 33789 return __ret; 33790 } 33791 #else 33792 __ai __attribute__((target("neon"))) int8x8_t vtbx2_s8(int8x8_t __p0, int8x8x2_t __p1, int8x8_t __p2) { 33793 int8x8_t __ret; 33794 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33795 int8x8x2_t __rev1; 33796 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33797 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33798 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33799 __ret = (int8x8_t) __builtin_neon_vtbx2_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev2, 0); 33800 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33801 return __ret; 33802 } 33803 #endif 33804 33805 #ifdef __LITTLE_ENDIAN__ 33806 __ai __attribute__((target("neon"))) poly8x8_t vtbx3_p8(poly8x8_t __p0, poly8x8x3_t __p1, uint8x8_t __p2) { 33807 poly8x8_t __ret; 
33808 __ret = (poly8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p2, 4); 33809 return __ret; 33810 } 33811 #else 33812 __ai __attribute__((target("neon"))) poly8x8_t vtbx3_p8(poly8x8_t __p0, poly8x8x3_t __p1, uint8x8_t __p2) { 33813 poly8x8_t __ret; 33814 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33815 poly8x8x3_t __rev1; 33816 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33817 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33818 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33819 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33820 __ret = (poly8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev2, 4); 33821 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33822 return __ret; 33823 } 33824 #endif 33825 33826 #ifdef __LITTLE_ENDIAN__ 33827 __ai __attribute__((target("neon"))) uint8x8_t vtbx3_u8(uint8x8_t __p0, uint8x8x3_t __p1, uint8x8_t __p2) { 33828 uint8x8_t __ret; 33829 __ret = (uint8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p2, 16); 33830 return __ret; 33831 } 33832 #else 33833 __ai __attribute__((target("neon"))) uint8x8_t vtbx3_u8(uint8x8_t __p0, uint8x8x3_t __p1, uint8x8_t __p2) { 33834 uint8x8_t __ret; 33835 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33836 uint8x8x3_t __rev1; 33837 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33838 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33839 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], 
__p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33840 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33841 __ret = (uint8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev2, 16); 33842 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33843 return __ret; 33844 } 33845 #endif 33846 33847 #ifdef __LITTLE_ENDIAN__ 33848 __ai __attribute__((target("neon"))) int8x8_t vtbx3_s8(int8x8_t __p0, int8x8x3_t __p1, int8x8_t __p2) { 33849 int8x8_t __ret; 33850 __ret = (int8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p2, 0); 33851 return __ret; 33852 } 33853 #else 33854 __ai __attribute__((target("neon"))) int8x8_t vtbx3_s8(int8x8_t __p0, int8x8x3_t __p1, int8x8_t __p2) { 33855 int8x8_t __ret; 33856 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33857 int8x8x3_t __rev1; 33858 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33859 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33860 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33861 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33862 __ret = (int8x8_t) __builtin_neon_vtbx3_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev2, 0); 33863 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33864 return __ret; 33865 } 33866 #endif 33867 33868 #ifdef __LITTLE_ENDIAN__ 33869 __ai __attribute__((target("neon"))) poly8x8_t vtbx4_p8(poly8x8_t __p0, poly8x8x4_t __p1, uint8x8_t __p2) { 33870 poly8x8_t __ret; 33871 __ret = (poly8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], 
(int8x8_t)__p1.val[3], (int8x8_t)__p2, 4); 33872 return __ret; 33873 } 33874 #else 33875 __ai __attribute__((target("neon"))) poly8x8_t vtbx4_p8(poly8x8_t __p0, poly8x8x4_t __p1, uint8x8_t __p2) { 33876 poly8x8_t __ret; 33877 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33878 poly8x8x4_t __rev1; 33879 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33880 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33881 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33882 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); 33883 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33884 __ret = (poly8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], (int8x8_t)__rev2, 4); 33885 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33886 return __ret; 33887 } 33888 #endif 33889 33890 #ifdef __LITTLE_ENDIAN__ 33891 __ai __attribute__((target("neon"))) uint8x8_t vtbx4_u8(uint8x8_t __p0, uint8x8x4_t __p1, uint8x8_t __p2) { 33892 uint8x8_t __ret; 33893 __ret = (uint8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p1.val[3], (int8x8_t)__p2, 16); 33894 return __ret; 33895 } 33896 #else 33897 __ai __attribute__((target("neon"))) uint8x8_t vtbx4_u8(uint8x8_t __p0, uint8x8x4_t __p1, uint8x8_t __p2) { 33898 uint8x8_t __ret; 33899 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33900 uint8x8x4_t __rev1; 33901 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33902 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33903 __rev1.val[2] = 
__builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33904 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); 33905 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33906 __ret = (uint8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], (int8x8_t)__rev2, 16); 33907 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33908 return __ret; 33909 } 33910 #endif 33911 33912 #ifdef __LITTLE_ENDIAN__ 33913 __ai __attribute__((target("neon"))) int8x8_t vtbx4_s8(int8x8_t __p0, int8x8x4_t __p1, int8x8_t __p2) { 33914 int8x8_t __ret; 33915 __ret = (int8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__p0, (int8x8_t)__p1.val[0], (int8x8_t)__p1.val[1], (int8x8_t)__p1.val[2], (int8x8_t)__p1.val[3], (int8x8_t)__p2, 0); 33916 return __ret; 33917 } 33918 #else 33919 __ai __attribute__((target("neon"))) int8x8_t vtbx4_s8(int8x8_t __p0, int8x8x4_t __p1, int8x8_t __p2) { 33920 int8x8_t __ret; 33921 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33922 int8x8x4_t __rev1; 33923 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33924 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33925 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); 33926 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); 33927 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 33928 __ret = (int8x8_t) __builtin_neon_vtbx4_v((int8x8_t)__rev0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], (int8x8_t)__rev2, 0); 33929 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 33930 return __ret; 33931 } 33932 #endif 
33933 33934 #ifdef __LITTLE_ENDIAN__ 33935 __ai __attribute__((target("neon"))) poly8x8x2_t vtrn_p8(poly8x8_t __p0, poly8x8_t __p1) { 33936 poly8x8x2_t __ret; 33937 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 4); 33938 return __ret; 33939 } 33940 #else 33941 __ai __attribute__((target("neon"))) poly8x8x2_t vtrn_p8(poly8x8_t __p0, poly8x8_t __p1) { 33942 poly8x8x2_t __ret; 33943 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 33944 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 33945 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 4); 33946 33947 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 33948 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 33949 return __ret; 33950 } 33951 #endif 33952 33953 #ifdef __LITTLE_ENDIAN__ 33954 __ai __attribute__((target("neon"))) poly16x4x2_t vtrn_p16(poly16x4_t __p0, poly16x4_t __p1) { 33955 poly16x4x2_t __ret; 33956 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 5); 33957 return __ret; 33958 } 33959 #else 33960 __ai __attribute__((target("neon"))) poly16x4x2_t vtrn_p16(poly16x4_t __p0, poly16x4_t __p1) { 33961 poly16x4x2_t __ret; 33962 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 33963 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 33964 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 5); 33965 33966 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 33967 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 33968 return __ret; 33969 } 33970 #endif 33971 33972 #ifdef __LITTLE_ENDIAN__ 33973 __ai __attribute__((target("neon"))) poly8x16x2_t vtrnq_p8(poly8x16_t __p0, poly8x16_t __p1) { 33974 poly8x16x2_t __ret; 33975 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 
36); 33976 return __ret; 33977 } 33978 #else 33979 __ai __attribute__((target("neon"))) poly8x16x2_t vtrnq_p8(poly8x16_t __p0, poly8x16_t __p1) { 33980 poly8x16x2_t __ret; 33981 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 33982 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 33983 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 36); 33984 33985 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 33986 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 33987 return __ret; 33988 } 33989 #endif 33990 33991 #ifdef __LITTLE_ENDIAN__ 33992 __ai __attribute__((target("neon"))) poly16x8x2_t vtrnq_p16(poly16x8_t __p0, poly16x8_t __p1) { 33993 poly16x8x2_t __ret; 33994 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 37); 33995 return __ret; 33996 } 33997 #else 33998 __ai __attribute__((target("neon"))) poly16x8x2_t vtrnq_p16(poly16x8_t __p0, poly16x8_t __p1) { 33999 poly16x8x2_t __ret; 34000 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34001 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34002 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 37); 34003 34004 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34005 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34006 return __ret; 34007 } 34008 #endif 34009 34010 #ifdef __LITTLE_ENDIAN__ 34011 __ai __attribute__((target("neon"))) uint8x16x2_t vtrnq_u8(uint8x16_t __p0, uint8x16_t __p1) { 34012 uint8x16x2_t __ret; 34013 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 48); 34014 return __ret; 34015 } 
34016 #else 34017 __ai __attribute__((target("neon"))) uint8x16x2_t vtrnq_u8(uint8x16_t __p0, uint8x16_t __p1) { 34018 uint8x16x2_t __ret; 34019 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34020 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34021 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 48); 34022 34023 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34024 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34025 return __ret; 34026 } 34027 #endif 34028 34029 #ifdef __LITTLE_ENDIAN__ 34030 __ai __attribute__((target("neon"))) uint32x4x2_t vtrnq_u32(uint32x4_t __p0, uint32x4_t __p1) { 34031 uint32x4x2_t __ret; 34032 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 50); 34033 return __ret; 34034 } 34035 #else 34036 __ai __attribute__((target("neon"))) uint32x4x2_t vtrnq_u32(uint32x4_t __p0, uint32x4_t __p1) { 34037 uint32x4x2_t __ret; 34038 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34039 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34040 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 50); 34041 34042 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34043 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34044 return __ret; 34045 } 34046 #endif 34047 34048 #ifdef __LITTLE_ENDIAN__ 34049 __ai __attribute__((target("neon"))) uint16x8x2_t vtrnq_u16(uint16x8_t __p0, uint16x8_t __p1) { 34050 uint16x8x2_t __ret; 34051 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 49); 34052 return __ret; 34053 } 34054 #else 34055 __ai __attribute__((target("neon"))) uint16x8x2_t 
vtrnq_u16(uint16x8_t __p0, uint16x8_t __p1) { 34056 uint16x8x2_t __ret; 34057 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34058 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34059 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 49); 34060 34061 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34062 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34063 return __ret; 34064 } 34065 #endif 34066 34067 #ifdef __LITTLE_ENDIAN__ 34068 __ai __attribute__((target("neon"))) int8x16x2_t vtrnq_s8(int8x16_t __p0, int8x16_t __p1) { 34069 int8x16x2_t __ret; 34070 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 32); 34071 return __ret; 34072 } 34073 #else 34074 __ai __attribute__((target("neon"))) int8x16x2_t vtrnq_s8(int8x16_t __p0, int8x16_t __p1) { 34075 int8x16x2_t __ret; 34076 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34077 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34078 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 32); 34079 34080 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34081 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34082 return __ret; 34083 } 34084 #endif 34085 34086 #ifdef __LITTLE_ENDIAN__ 34087 __ai __attribute__((target("neon"))) float32x4x2_t vtrnq_f32(float32x4_t __p0, float32x4_t __p1) { 34088 float32x4x2_t __ret; 34089 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 41); 34090 return __ret; 34091 } 34092 #else 34093 __ai __attribute__((target("neon"))) float32x4x2_t vtrnq_f32(float32x4_t __p0, float32x4_t 
__p1) { 34094 float32x4x2_t __ret; 34095 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34096 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34097 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 41); 34098 34099 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34100 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34101 return __ret; 34102 } 34103 #endif 34104 34105 #ifdef __LITTLE_ENDIAN__ 34106 __ai __attribute__((target("neon"))) int32x4x2_t vtrnq_s32(int32x4_t __p0, int32x4_t __p1) { 34107 int32x4x2_t __ret; 34108 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 34); 34109 return __ret; 34110 } 34111 #else 34112 __ai __attribute__((target("neon"))) int32x4x2_t vtrnq_s32(int32x4_t __p0, int32x4_t __p1) { 34113 int32x4x2_t __ret; 34114 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34115 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34116 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 34); 34117 34118 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34119 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34120 return __ret; 34121 } 34122 #endif 34123 34124 #ifdef __LITTLE_ENDIAN__ 34125 __ai __attribute__((target("neon"))) int16x8x2_t vtrnq_s16(int16x8_t __p0, int16x8_t __p1) { 34126 int16x8x2_t __ret; 34127 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 33); 34128 return __ret; 34129 } 34130 #else 34131 __ai __attribute__((target("neon"))) int16x8x2_t vtrnq_s16(int16x8_t __p0, int16x8_t __p1) { 34132 int16x8x2_t __ret; 34133 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34134 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34135 __builtin_neon_vtrnq_v(&__ret, 
(int8x16_t)__rev0, (int8x16_t)__rev1, 33); 34136 34137 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34138 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34139 return __ret; 34140 } 34141 #endif 34142 34143 #ifdef __LITTLE_ENDIAN__ 34144 __ai __attribute__((target("neon"))) uint8x8x2_t vtrn_u8(uint8x8_t __p0, uint8x8_t __p1) { 34145 uint8x8x2_t __ret; 34146 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 16); 34147 return __ret; 34148 } 34149 #else 34150 __ai __attribute__((target("neon"))) uint8x8x2_t vtrn_u8(uint8x8_t __p0, uint8x8_t __p1) { 34151 uint8x8x2_t __ret; 34152 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34153 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34154 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 16); 34155 34156 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34157 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34158 return __ret; 34159 } 34160 #endif 34161 34162 #ifdef __LITTLE_ENDIAN__ 34163 __ai __attribute__((target("neon"))) uint32x2x2_t vtrn_u32(uint32x2_t __p0, uint32x2_t __p1) { 34164 uint32x2x2_t __ret; 34165 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 18); 34166 return __ret; 34167 } 34168 #else 34169 __ai __attribute__((target("neon"))) uint32x2x2_t vtrn_u32(uint32x2_t __p0, uint32x2_t __p1) { 34170 uint32x2x2_t __ret; 34171 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 34172 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 34173 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 18); 34174 34175 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 34176 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 34177 
return __ret; 34178 } 34179 #endif 34180 34181 #ifdef __LITTLE_ENDIAN__ 34182 __ai __attribute__((target("neon"))) uint16x4x2_t vtrn_u16(uint16x4_t __p0, uint16x4_t __p1) { 34183 uint16x4x2_t __ret; 34184 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 17); 34185 return __ret; 34186 } 34187 #else 34188 __ai __attribute__((target("neon"))) uint16x4x2_t vtrn_u16(uint16x4_t __p0, uint16x4_t __p1) { 34189 uint16x4x2_t __ret; 34190 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34191 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34192 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 17); 34193 34194 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34195 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34196 return __ret; 34197 } 34198 #endif 34199 34200 #ifdef __LITTLE_ENDIAN__ 34201 __ai __attribute__((target("neon"))) int8x8x2_t vtrn_s8(int8x8_t __p0, int8x8_t __p1) { 34202 int8x8x2_t __ret; 34203 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 0); 34204 return __ret; 34205 } 34206 #else 34207 __ai __attribute__((target("neon"))) int8x8x2_t vtrn_s8(int8x8_t __p0, int8x8_t __p1) { 34208 int8x8x2_t __ret; 34209 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34210 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34211 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 0); 34212 34213 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34214 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34215 return __ret; 34216 } 34217 #endif 34218 34219 #ifdef __LITTLE_ENDIAN__ 34220 __ai __attribute__((target("neon"))) float32x2x2_t vtrn_f32(float32x2_t __p0, float32x2_t __p1) { 34221 float32x2x2_t __ret; 34222 __builtin_neon_vtrn_v(&__ret, 
(int8x8_t)__p0, (int8x8_t)__p1, 9); 34223 return __ret; 34224 } 34225 #else 34226 __ai __attribute__((target("neon"))) float32x2x2_t vtrn_f32(float32x2_t __p0, float32x2_t __p1) { 34227 float32x2x2_t __ret; 34228 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 34229 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 34230 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 9); 34231 34232 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 34233 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 34234 return __ret; 34235 } 34236 #endif 34237 34238 #ifdef __LITTLE_ENDIAN__ 34239 __ai __attribute__((target("neon"))) int32x2x2_t vtrn_s32(int32x2_t __p0, int32x2_t __p1) { 34240 int32x2x2_t __ret; 34241 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 2); 34242 return __ret; 34243 } 34244 #else 34245 __ai __attribute__((target("neon"))) int32x2x2_t vtrn_s32(int32x2_t __p0, int32x2_t __p1) { 34246 int32x2x2_t __ret; 34247 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 34248 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 34249 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 2); 34250 34251 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 34252 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 34253 return __ret; 34254 } 34255 #endif 34256 34257 #ifdef __LITTLE_ENDIAN__ 34258 __ai __attribute__((target("neon"))) int16x4x2_t vtrn_s16(int16x4_t __p0, int16x4_t __p1) { 34259 int16x4x2_t __ret; 34260 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 1); 34261 return __ret; 34262 } 34263 #else 34264 __ai __attribute__((target("neon"))) int16x4x2_t vtrn_s16(int16x4_t __p0, int16x4_t __p1) { 34265 int16x4x2_t __ret; 34266 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34267 int16x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34268 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 1); 34269 34270 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34271 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34272 return __ret; 34273 } 34274 #endif 34275 34276 #ifdef __LITTLE_ENDIAN__ 34277 __ai __attribute__((target("neon"))) float16x8x2_t vtrnq_f16(float16x8_t __p0, float16x8_t __p1) { 34278 float16x8x2_t __ret; 34279 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 40); 34280 return __ret; 34281 } 34282 #else 34283 __ai __attribute__((target("neon"))) float16x8x2_t vtrnq_f16(float16x8_t __p0, float16x8_t __p1) { 34284 float16x8x2_t __ret; 34285 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34286 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34287 __builtin_neon_vtrnq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 40); 34288 34289 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34290 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34291 return __ret; 34292 } 34293 #endif 34294 34295 #ifdef __LITTLE_ENDIAN__ 34296 __ai __attribute__((target("neon"))) float16x4x2_t vtrn_f16(float16x4_t __p0, float16x4_t __p1) { 34297 float16x4x2_t __ret; 34298 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 8); 34299 return __ret; 34300 } 34301 #else 34302 __ai __attribute__((target("neon"))) float16x4x2_t vtrn_f16(float16x4_t __p0, float16x4_t __p1) { 34303 float16x4x2_t __ret; 34304 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34305 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34306 __builtin_neon_vtrn_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 8); 34307 34308 __ret.val[0] = __builtin_shufflevector(__ret.val[0], 
__ret.val[0], 3, 2, 1, 0); 34309 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34310 return __ret; 34311 } 34312 #endif 34313 34314 #ifdef __LITTLE_ENDIAN__ 34315 __ai __attribute__((target("neon"))) uint8x8_t vtst_p8(poly8x8_t __p0, poly8x8_t __p1) { 34316 uint8x8_t __ret; 34317 __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 34318 return __ret; 34319 } 34320 #else 34321 __ai __attribute__((target("neon"))) uint8x8_t vtst_p8(poly8x8_t __p0, poly8x8_t __p1) { 34322 uint8x8_t __ret; 34323 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34324 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34325 __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 34326 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 34327 return __ret; 34328 } 34329 #endif 34330 34331 #ifdef __LITTLE_ENDIAN__ 34332 __ai __attribute__((target("neon"))) uint16x4_t vtst_p16(poly16x4_t __p0, poly16x4_t __p1) { 34333 uint16x4_t __ret; 34334 __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 34335 return __ret; 34336 } 34337 #else 34338 __ai __attribute__((target("neon"))) uint16x4_t vtst_p16(poly16x4_t __p0, poly16x4_t __p1) { 34339 uint16x4_t __ret; 34340 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34341 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34342 __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 34343 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 34344 return __ret; 34345 } 34346 #endif 34347 34348 #ifdef __LITTLE_ENDIAN__ 34349 __ai __attribute__((target("neon"))) uint8x16_t vtstq_p8(poly8x16_t __p0, poly8x16_t __p1) { 34350 uint8x16_t __ret; 34351 __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 34352 return __ret; 34353 } 
34354 #else 34355 __ai __attribute__((target("neon"))) uint8x16_t vtstq_p8(poly8x16_t __p0, poly8x16_t __p1) { 34356 uint8x16_t __ret; 34357 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34358 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34359 __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 34360 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34361 return __ret; 34362 } 34363 #endif 34364 34365 #ifdef __LITTLE_ENDIAN__ 34366 __ai __attribute__((target("neon"))) uint16x8_t vtstq_p16(poly16x8_t __p0, poly16x8_t __p1) { 34367 uint16x8_t __ret; 34368 __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 34369 return __ret; 34370 } 34371 #else 34372 __ai __attribute__((target("neon"))) uint16x8_t vtstq_p16(poly16x8_t __p0, poly16x8_t __p1) { 34373 uint16x8_t __ret; 34374 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34375 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34376 __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 34377 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 34378 return __ret; 34379 } 34380 #endif 34381 34382 #ifdef __LITTLE_ENDIAN__ 34383 __ai __attribute__((target("neon"))) uint8x16_t vtstq_u8(uint8x16_t __p0, uint8x16_t __p1) { 34384 uint8x16_t __ret; 34385 __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 34386 return __ret; 34387 } 34388 #else 34389 __ai __attribute__((target("neon"))) uint8x16_t vtstq_u8(uint8x16_t __p0, uint8x16_t __p1) { 34390 uint8x16_t __ret; 34391 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34392 uint8x16_t 
__rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34393 __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 34394 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34395 return __ret; 34396 } 34397 #endif 34398 34399 #ifdef __LITTLE_ENDIAN__ 34400 __ai __attribute__((target("neon"))) uint32x4_t vtstq_u32(uint32x4_t __p0, uint32x4_t __p1) { 34401 uint32x4_t __ret; 34402 __ret = (uint32x4_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 34403 return __ret; 34404 } 34405 #else 34406 __ai __attribute__((target("neon"))) uint32x4_t vtstq_u32(uint32x4_t __p0, uint32x4_t __p1) { 34407 uint32x4_t __ret; 34408 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34409 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34410 __ret = (uint32x4_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 34411 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 34412 return __ret; 34413 } 34414 #endif 34415 34416 #ifdef __LITTLE_ENDIAN__ 34417 __ai __attribute__((target("neon"))) uint16x8_t vtstq_u16(uint16x8_t __p0, uint16x8_t __p1) { 34418 uint16x8_t __ret; 34419 __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 34420 return __ret; 34421 } 34422 #else 34423 __ai __attribute__((target("neon"))) uint16x8_t vtstq_u16(uint16x8_t __p0, uint16x8_t __p1) { 34424 uint16x8_t __ret; 34425 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34426 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34427 __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 34428 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 34429 return __ret; 34430 } 34431 #endif 34432 34433 #ifdef __LITTLE_ENDIAN__ 34434 __ai 
__attribute__((target("neon"))) uint8x16_t vtstq_s8(int8x16_t __p0, int8x16_t __p1) { 34435 uint8x16_t __ret; 34436 __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 34437 return __ret; 34438 } 34439 #else 34440 __ai __attribute__((target("neon"))) uint8x16_t vtstq_s8(int8x16_t __p0, int8x16_t __p1) { 34441 uint8x16_t __ret; 34442 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34443 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34444 __ret = (uint8x16_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 34445 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34446 return __ret; 34447 } 34448 #endif 34449 34450 #ifdef __LITTLE_ENDIAN__ 34451 __ai __attribute__((target("neon"))) uint32x4_t vtstq_s32(int32x4_t __p0, int32x4_t __p1) { 34452 uint32x4_t __ret; 34453 __ret = (uint32x4_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 34454 return __ret; 34455 } 34456 #else 34457 __ai __attribute__((target("neon"))) uint32x4_t vtstq_s32(int32x4_t __p0, int32x4_t __p1) { 34458 uint32x4_t __ret; 34459 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34460 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34461 __ret = (uint32x4_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 34462 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 34463 return __ret; 34464 } 34465 #endif 34466 34467 #ifdef __LITTLE_ENDIAN__ 34468 __ai __attribute__((target("neon"))) uint16x8_t vtstq_s16(int16x8_t __p0, int16x8_t __p1) { 34469 uint16x8_t __ret; 34470 __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 34471 return __ret; 34472 } 34473 #else 34474 __ai __attribute__((target("neon"))) uint16x8_t vtstq_s16(int16x8_t __p0, int16x8_t 
__p1) { 34475 uint16x8_t __ret; 34476 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34477 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34478 __ret = (uint16x8_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 34479 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 34480 return __ret; 34481 } 34482 #endif 34483 34484 #ifdef __LITTLE_ENDIAN__ 34485 __ai __attribute__((target("neon"))) uint8x8_t vtst_u8(uint8x8_t __p0, uint8x8_t __p1) { 34486 uint8x8_t __ret; 34487 __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 34488 return __ret; 34489 } 34490 #else 34491 __ai __attribute__((target("neon"))) uint8x8_t vtst_u8(uint8x8_t __p0, uint8x8_t __p1) { 34492 uint8x8_t __ret; 34493 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34494 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34495 __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 34496 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 34497 return __ret; 34498 } 34499 #endif 34500 34501 #ifdef __LITTLE_ENDIAN__ 34502 __ai __attribute__((target("neon"))) uint32x2_t vtst_u32(uint32x2_t __p0, uint32x2_t __p1) { 34503 uint32x2_t __ret; 34504 __ret = (uint32x2_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 34505 return __ret; 34506 } 34507 #else 34508 __ai __attribute__((target("neon"))) uint32x2_t vtst_u32(uint32x2_t __p0, uint32x2_t __p1) { 34509 uint32x2_t __ret; 34510 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 34511 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 34512 __ret = (uint32x2_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 34513 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 34514 return __ret; 34515 } 34516 #endif 34517 34518 #ifdef 
__LITTLE_ENDIAN__ 34519 __ai __attribute__((target("neon"))) uint16x4_t vtst_u16(uint16x4_t __p0, uint16x4_t __p1) { 34520 uint16x4_t __ret; 34521 __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 34522 return __ret; 34523 } 34524 #else 34525 __ai __attribute__((target("neon"))) uint16x4_t vtst_u16(uint16x4_t __p0, uint16x4_t __p1) { 34526 uint16x4_t __ret; 34527 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34528 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34529 __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 34530 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 34531 return __ret; 34532 } 34533 #endif 34534 34535 #ifdef __LITTLE_ENDIAN__ 34536 __ai __attribute__((target("neon"))) uint8x8_t vtst_s8(int8x8_t __p0, int8x8_t __p1) { 34537 uint8x8_t __ret; 34538 __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 34539 return __ret; 34540 } 34541 #else 34542 __ai __attribute__((target("neon"))) uint8x8_t vtst_s8(int8x8_t __p0, int8x8_t __p1) { 34543 uint8x8_t __ret; 34544 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34545 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34546 __ret = (uint8x8_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 34547 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 34548 return __ret; 34549 } 34550 #endif 34551 34552 #ifdef __LITTLE_ENDIAN__ 34553 __ai __attribute__((target("neon"))) uint32x2_t vtst_s32(int32x2_t __p0, int32x2_t __p1) { 34554 uint32x2_t __ret; 34555 __ret = (uint32x2_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 34556 return __ret; 34557 } 34558 #else 34559 __ai __attribute__((target("neon"))) uint32x2_t vtst_s32(int32x2_t __p0, int32x2_t __p1) { 34560 uint32x2_t __ret; 34561 int32x2_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 1, 0); 34562 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 34563 __ret = (uint32x2_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 34564 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 34565 return __ret; 34566 } 34567 #endif 34568 34569 #ifdef __LITTLE_ENDIAN__ 34570 __ai __attribute__((target("neon"))) uint16x4_t vtst_s16(int16x4_t __p0, int16x4_t __p1) { 34571 uint16x4_t __ret; 34572 __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 34573 return __ret; 34574 } 34575 #else 34576 __ai __attribute__((target("neon"))) uint16x4_t vtst_s16(int16x4_t __p0, int16x4_t __p1) { 34577 uint16x4_t __ret; 34578 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34579 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34580 __ret = (uint16x4_t) __builtin_neon_vtst_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 34581 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 34582 return __ret; 34583 } 34584 #endif 34585 34586 #ifdef __LITTLE_ENDIAN__ 34587 __ai __attribute__((target("neon"))) poly8x8x2_t vuzp_p8(poly8x8_t __p0, poly8x8_t __p1) { 34588 poly8x8x2_t __ret; 34589 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 4); 34590 return __ret; 34591 } 34592 #else 34593 __ai __attribute__((target("neon"))) poly8x8x2_t vuzp_p8(poly8x8_t __p0, poly8x8_t __p1) { 34594 poly8x8x2_t __ret; 34595 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34596 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34597 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 4); 34598 34599 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34600 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34601 return __ret; 34602 } 34603 #endif 34604 34605 #ifdef 
__LITTLE_ENDIAN__ 34606 __ai __attribute__((target("neon"))) poly16x4x2_t vuzp_p16(poly16x4_t __p0, poly16x4_t __p1) { 34607 poly16x4x2_t __ret; 34608 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 5); 34609 return __ret; 34610 } 34611 #else 34612 __ai __attribute__((target("neon"))) poly16x4x2_t vuzp_p16(poly16x4_t __p0, poly16x4_t __p1) { 34613 poly16x4x2_t __ret; 34614 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34615 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34616 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 5); 34617 34618 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34619 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34620 return __ret; 34621 } 34622 #endif 34623 34624 #ifdef __LITTLE_ENDIAN__ 34625 __ai __attribute__((target("neon"))) poly8x16x2_t vuzpq_p8(poly8x16_t __p0, poly8x16_t __p1) { 34626 poly8x16x2_t __ret; 34627 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 36); 34628 return __ret; 34629 } 34630 #else 34631 __ai __attribute__((target("neon"))) poly8x16x2_t vuzpq_p8(poly8x16_t __p0, poly8x16_t __p1) { 34632 poly8x16x2_t __ret; 34633 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34634 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34635 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 36); 34636 34637 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34638 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34639 return __ret; 34640 } 34641 #endif 34642 34643 #ifdef __LITTLE_ENDIAN__ 34644 __ai __attribute__((target("neon"))) poly16x8x2_t vuzpq_p16(poly16x8_t 
__p0, poly16x8_t __p1) { 34645 poly16x8x2_t __ret; 34646 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 37); 34647 return __ret; 34648 } 34649 #else 34650 __ai __attribute__((target("neon"))) poly16x8x2_t vuzpq_p16(poly16x8_t __p0, poly16x8_t __p1) { 34651 poly16x8x2_t __ret; 34652 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34653 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34654 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 37); 34655 34656 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34657 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34658 return __ret; 34659 } 34660 #endif 34661 34662 #ifdef __LITTLE_ENDIAN__ 34663 __ai __attribute__((target("neon"))) uint8x16x2_t vuzpq_u8(uint8x16_t __p0, uint8x16_t __p1) { 34664 uint8x16x2_t __ret; 34665 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 48); 34666 return __ret; 34667 } 34668 #else 34669 __ai __attribute__((target("neon"))) uint8x16x2_t vuzpq_u8(uint8x16_t __p0, uint8x16_t __p1) { 34670 uint8x16x2_t __ret; 34671 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34672 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34673 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 48); 34674 34675 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34676 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34677 return __ret; 34678 } 34679 #endif 34680 34681 #ifdef __LITTLE_ENDIAN__ 34682 __ai __attribute__((target("neon"))) uint32x4x2_t vuzpq_u32(uint32x4_t __p0, uint32x4_t __p1) { 34683 
uint32x4x2_t __ret; 34684 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 50); 34685 return __ret; 34686 } 34687 #else 34688 __ai __attribute__((target("neon"))) uint32x4x2_t vuzpq_u32(uint32x4_t __p0, uint32x4_t __p1) { 34689 uint32x4x2_t __ret; 34690 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34691 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34692 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 50); 34693 34694 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34695 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34696 return __ret; 34697 } 34698 #endif 34699 34700 #ifdef __LITTLE_ENDIAN__ 34701 __ai __attribute__((target("neon"))) uint16x8x2_t vuzpq_u16(uint16x8_t __p0, uint16x8_t __p1) { 34702 uint16x8x2_t __ret; 34703 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 49); 34704 return __ret; 34705 } 34706 #else 34707 __ai __attribute__((target("neon"))) uint16x8x2_t vuzpq_u16(uint16x8_t __p0, uint16x8_t __p1) { 34708 uint16x8x2_t __ret; 34709 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34710 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34711 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 49); 34712 34713 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34714 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34715 return __ret; 34716 } 34717 #endif 34718 34719 #ifdef __LITTLE_ENDIAN__ 34720 __ai __attribute__((target("neon"))) int8x16x2_t vuzpq_s8(int8x16_t __p0, int8x16_t __p1) { 34721 int8x16x2_t __ret; 34722 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 32); 34723 return __ret; 34724 } 34725 #else 34726 __ai __attribute__((target("neon"))) int8x16x2_t 
vuzpq_s8(int8x16_t __p0, int8x16_t __p1) { 34727 int8x16x2_t __ret; 34728 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34729 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34730 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 32); 34731 34732 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34733 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 34734 return __ret; 34735 } 34736 #endif 34737 34738 #ifdef __LITTLE_ENDIAN__ 34739 __ai __attribute__((target("neon"))) float32x4x2_t vuzpq_f32(float32x4_t __p0, float32x4_t __p1) { 34740 float32x4x2_t __ret; 34741 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 41); 34742 return __ret; 34743 } 34744 #else 34745 __ai __attribute__((target("neon"))) float32x4x2_t vuzpq_f32(float32x4_t __p0, float32x4_t __p1) { 34746 float32x4x2_t __ret; 34747 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34748 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34749 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 41); 34750 34751 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34752 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34753 return __ret; 34754 } 34755 #endif 34756 34757 #ifdef __LITTLE_ENDIAN__ 34758 __ai __attribute__((target("neon"))) int32x4x2_t vuzpq_s32(int32x4_t __p0, int32x4_t __p1) { 34759 int32x4x2_t __ret; 34760 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 34); 34761 return __ret; 34762 } 34763 #else 34764 __ai __attribute__((target("neon"))) int32x4x2_t vuzpq_s32(int32x4_t __p0, int32x4_t __p1) { 34765 int32x4x2_t __ret; 34766 int32x4_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34767 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34768 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 34); 34769 34770 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34771 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34772 return __ret; 34773 } 34774 #endif 34775 34776 #ifdef __LITTLE_ENDIAN__ 34777 __ai __attribute__((target("neon"))) int16x8x2_t vuzpq_s16(int16x8_t __p0, int16x8_t __p1) { 34778 int16x8x2_t __ret; 34779 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 33); 34780 return __ret; 34781 } 34782 #else 34783 __ai __attribute__((target("neon"))) int16x8x2_t vuzpq_s16(int16x8_t __p0, int16x8_t __p1) { 34784 int16x8x2_t __ret; 34785 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34786 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34787 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 33); 34788 34789 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34790 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34791 return __ret; 34792 } 34793 #endif 34794 34795 #ifdef __LITTLE_ENDIAN__ 34796 __ai __attribute__((target("neon"))) uint8x8x2_t vuzp_u8(uint8x8_t __p0, uint8x8_t __p1) { 34797 uint8x8x2_t __ret; 34798 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 16); 34799 return __ret; 34800 } 34801 #else 34802 __ai __attribute__((target("neon"))) uint8x8x2_t vuzp_u8(uint8x8_t __p0, uint8x8_t __p1) { 34803 uint8x8x2_t __ret; 34804 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34805 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34806 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, 
(int8x8_t)__rev1, 16); 34807 34808 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34809 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34810 return __ret; 34811 } 34812 #endif 34813 34814 #ifdef __LITTLE_ENDIAN__ 34815 __ai __attribute__((target("neon"))) uint32x2x2_t vuzp_u32(uint32x2_t __p0, uint32x2_t __p1) { 34816 uint32x2x2_t __ret; 34817 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 18); 34818 return __ret; 34819 } 34820 #else 34821 __ai __attribute__((target("neon"))) uint32x2x2_t vuzp_u32(uint32x2_t __p0, uint32x2_t __p1) { 34822 uint32x2x2_t __ret; 34823 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 34824 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 34825 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 18); 34826 34827 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 34828 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 34829 return __ret; 34830 } 34831 #endif 34832 34833 #ifdef __LITTLE_ENDIAN__ 34834 __ai __attribute__((target("neon"))) uint16x4x2_t vuzp_u16(uint16x4_t __p0, uint16x4_t __p1) { 34835 uint16x4x2_t __ret; 34836 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 17); 34837 return __ret; 34838 } 34839 #else 34840 __ai __attribute__((target("neon"))) uint16x4x2_t vuzp_u16(uint16x4_t __p0, uint16x4_t __p1) { 34841 uint16x4x2_t __ret; 34842 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34843 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34844 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 17); 34845 34846 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34847 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34848 return __ret; 34849 } 34850 #endif 34851 34852 #ifdef 
__LITTLE_ENDIAN__ 34853 __ai __attribute__((target("neon"))) int8x8x2_t vuzp_s8(int8x8_t __p0, int8x8_t __p1) { 34854 int8x8x2_t __ret; 34855 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 0); 34856 return __ret; 34857 } 34858 #else 34859 __ai __attribute__((target("neon"))) int8x8x2_t vuzp_s8(int8x8_t __p0, int8x8_t __p1) { 34860 int8x8x2_t __ret; 34861 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34862 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34863 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 0); 34864 34865 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34866 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34867 return __ret; 34868 } 34869 #endif 34870 34871 #ifdef __LITTLE_ENDIAN__ 34872 __ai __attribute__((target("neon"))) float32x2x2_t vuzp_f32(float32x2_t __p0, float32x2_t __p1) { 34873 float32x2x2_t __ret; 34874 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 9); 34875 return __ret; 34876 } 34877 #else 34878 __ai __attribute__((target("neon"))) float32x2x2_t vuzp_f32(float32x2_t __p0, float32x2_t __p1) { 34879 float32x2x2_t __ret; 34880 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 34881 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 34882 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 9); 34883 34884 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 34885 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 34886 return __ret; 34887 } 34888 #endif 34889 34890 #ifdef __LITTLE_ENDIAN__ 34891 __ai __attribute__((target("neon"))) int32x2x2_t vuzp_s32(int32x2_t __p0, int32x2_t __p1) { 34892 int32x2x2_t __ret; 34893 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 2); 34894 return __ret; 34895 } 34896 #else 34897 
__ai __attribute__((target("neon"))) int32x2x2_t vuzp_s32(int32x2_t __p0, int32x2_t __p1) { 34898 int32x2x2_t __ret; 34899 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 34900 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 34901 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 2); 34902 34903 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 34904 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 34905 return __ret; 34906 } 34907 #endif 34908 34909 #ifdef __LITTLE_ENDIAN__ 34910 __ai __attribute__((target("neon"))) int16x4x2_t vuzp_s16(int16x4_t __p0, int16x4_t __p1) { 34911 int16x4x2_t __ret; 34912 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 1); 34913 return __ret; 34914 } 34915 #else 34916 __ai __attribute__((target("neon"))) int16x4x2_t vuzp_s16(int16x4_t __p0, int16x4_t __p1) { 34917 int16x4x2_t __ret; 34918 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34919 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34920 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 1); 34921 34922 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34923 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34924 return __ret; 34925 } 34926 #endif 34927 34928 #ifdef __LITTLE_ENDIAN__ 34929 __ai __attribute__((target("neon"))) float16x8x2_t vuzpq_f16(float16x8_t __p0, float16x8_t __p1) { 34930 float16x8x2_t __ret; 34931 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 40); 34932 return __ret; 34933 } 34934 #else 34935 __ai __attribute__((target("neon"))) float16x8x2_t vuzpq_f16(float16x8_t __p0, float16x8_t __p1) { 34936 float16x8x2_t __ret; 34937 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34938 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 
4, 3, 2, 1, 0); 34939 __builtin_neon_vuzpq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 40); 34940 34941 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34942 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34943 return __ret; 34944 } 34945 #endif 34946 34947 #ifdef __LITTLE_ENDIAN__ 34948 __ai __attribute__((target("neon"))) float16x4x2_t vuzp_f16(float16x4_t __p0, float16x4_t __p1) { 34949 float16x4x2_t __ret; 34950 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 8); 34951 return __ret; 34952 } 34953 #else 34954 __ai __attribute__((target("neon"))) float16x4x2_t vuzp_f16(float16x4_t __p0, float16x4_t __p1) { 34955 float16x4x2_t __ret; 34956 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34957 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34958 __builtin_neon_vuzp_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 8); 34959 34960 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34961 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 34962 return __ret; 34963 } 34964 #endif 34965 34966 #ifdef __LITTLE_ENDIAN__ 34967 __ai __attribute__((target("neon"))) poly8x8x2_t vzip_p8(poly8x8_t __p0, poly8x8_t __p1) { 34968 poly8x8x2_t __ret; 34969 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 4); 34970 return __ret; 34971 } 34972 #else 34973 __ai __attribute__((target("neon"))) poly8x8x2_t vzip_p8(poly8x8_t __p0, poly8x8_t __p1) { 34974 poly8x8x2_t __ret; 34975 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 34976 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 34977 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 4); 34978 34979 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 34980 __ret.val[1] = 
__builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 34981 return __ret; 34982 } 34983 #endif 34984 34985 #ifdef __LITTLE_ENDIAN__ 34986 __ai __attribute__((target("neon"))) poly16x4x2_t vzip_p16(poly16x4_t __p0, poly16x4_t __p1) { 34987 poly16x4x2_t __ret; 34988 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 5); 34989 return __ret; 34990 } 34991 #else 34992 __ai __attribute__((target("neon"))) poly16x4x2_t vzip_p16(poly16x4_t __p0, poly16x4_t __p1) { 34993 poly16x4x2_t __ret; 34994 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 34995 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 34996 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 5); 34997 34998 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 34999 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 35000 return __ret; 35001 } 35002 #endif 35003 35004 #ifdef __LITTLE_ENDIAN__ 35005 __ai __attribute__((target("neon"))) poly8x16x2_t vzipq_p8(poly8x16_t __p0, poly8x16_t __p1) { 35006 poly8x16x2_t __ret; 35007 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 36); 35008 return __ret; 35009 } 35010 #else 35011 __ai __attribute__((target("neon"))) poly8x16x2_t vzipq_p8(poly8x16_t __p0, poly8x16_t __p1) { 35012 poly8x16x2_t __ret; 35013 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35014 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35015 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 36); 35016 35017 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35018 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35019 return 
__ret; 35020 } 35021 #endif 35022 35023 #ifdef __LITTLE_ENDIAN__ 35024 __ai __attribute__((target("neon"))) poly16x8x2_t vzipq_p16(poly16x8_t __p0, poly16x8_t __p1) { 35025 poly16x8x2_t __ret; 35026 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 37); 35027 return __ret; 35028 } 35029 #else 35030 __ai __attribute__((target("neon"))) poly16x8x2_t vzipq_p16(poly16x8_t __p0, poly16x8_t __p1) { 35031 poly16x8x2_t __ret; 35032 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35033 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35034 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 37); 35035 35036 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 35037 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 35038 return __ret; 35039 } 35040 #endif 35041 35042 #ifdef __LITTLE_ENDIAN__ 35043 __ai __attribute__((target("neon"))) uint8x16x2_t vzipq_u8(uint8x16_t __p0, uint8x16_t __p1) { 35044 uint8x16x2_t __ret; 35045 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 48); 35046 return __ret; 35047 } 35048 #else 35049 __ai __attribute__((target("neon"))) uint8x16x2_t vzipq_u8(uint8x16_t __p0, uint8x16_t __p1) { 35050 uint8x16x2_t __ret; 35051 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35052 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35053 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 48); 35054 35055 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35056 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35057 return __ret; 35058 } 35059 #endif 35060 
35061 #ifdef __LITTLE_ENDIAN__ 35062 __ai __attribute__((target("neon"))) uint32x4x2_t vzipq_u32(uint32x4_t __p0, uint32x4_t __p1) { 35063 uint32x4x2_t __ret; 35064 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 50); 35065 return __ret; 35066 } 35067 #else 35068 __ai __attribute__((target("neon"))) uint32x4x2_t vzipq_u32(uint32x4_t __p0, uint32x4_t __p1) { 35069 uint32x4x2_t __ret; 35070 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35071 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35072 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 50); 35073 35074 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 35075 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 35076 return __ret; 35077 } 35078 #endif 35079 35080 #ifdef __LITTLE_ENDIAN__ 35081 __ai __attribute__((target("neon"))) uint16x8x2_t vzipq_u16(uint16x8_t __p0, uint16x8_t __p1) { 35082 uint16x8x2_t __ret; 35083 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 49); 35084 return __ret; 35085 } 35086 #else 35087 __ai __attribute__((target("neon"))) uint16x8x2_t vzipq_u16(uint16x8_t __p0, uint16x8_t __p1) { 35088 uint16x8x2_t __ret; 35089 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35090 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35091 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 49); 35092 35093 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 35094 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 35095 return __ret; 35096 } 35097 #endif 35098 35099 #ifdef __LITTLE_ENDIAN__ 35100 __ai __attribute__((target("neon"))) int8x16x2_t vzipq_s8(int8x16_t __p0, int8x16_t __p1) { 35101 int8x16x2_t __ret; 35102 __builtin_neon_vzipq_v(&__ret, 
(int8x16_t)__p0, (int8x16_t)__p1, 32); 35103 return __ret; 35104 } 35105 #else 35106 __ai __attribute__((target("neon"))) int8x16x2_t vzipq_s8(int8x16_t __p0, int8x16_t __p1) { 35107 int8x16x2_t __ret; 35108 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35109 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35110 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 32); 35111 35112 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35113 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 35114 return __ret; 35115 } 35116 #endif 35117 35118 #ifdef __LITTLE_ENDIAN__ 35119 __ai __attribute__((target("neon"))) float32x4x2_t vzipq_f32(float32x4_t __p0, float32x4_t __p1) { 35120 float32x4x2_t __ret; 35121 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 41); 35122 return __ret; 35123 } 35124 #else 35125 __ai __attribute__((target("neon"))) float32x4x2_t vzipq_f32(float32x4_t __p0, float32x4_t __p1) { 35126 float32x4x2_t __ret; 35127 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35128 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35129 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 41); 35130 35131 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 35132 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 35133 return __ret; 35134 } 35135 #endif 35136 35137 #ifdef __LITTLE_ENDIAN__ 35138 __ai __attribute__((target("neon"))) int32x4x2_t vzipq_s32(int32x4_t __p0, int32x4_t __p1) { 35139 int32x4x2_t __ret; 35140 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 34); 35141 return __ret; 35142 } 35143 #else 35144 
__ai __attribute__((target("neon"))) int32x4x2_t vzipq_s32(int32x4_t __p0, int32x4_t __p1) { 35145 int32x4x2_t __ret; 35146 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35147 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35148 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 34); 35149 35150 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 35151 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 35152 return __ret; 35153 } 35154 #endif 35155 35156 #ifdef __LITTLE_ENDIAN__ 35157 __ai __attribute__((target("neon"))) int16x8x2_t vzipq_s16(int16x8_t __p0, int16x8_t __p1) { 35158 int16x8x2_t __ret; 35159 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 33); 35160 return __ret; 35161 } 35162 #else 35163 __ai __attribute__((target("neon"))) int16x8x2_t vzipq_s16(int16x8_t __p0, int16x8_t __p1) { 35164 int16x8x2_t __ret; 35165 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35166 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35167 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 33); 35168 35169 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 35170 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 35171 return __ret; 35172 } 35173 #endif 35174 35175 #ifdef __LITTLE_ENDIAN__ 35176 __ai __attribute__((target("neon"))) uint8x8x2_t vzip_u8(uint8x8_t __p0, uint8x8_t __p1) { 35177 uint8x8x2_t __ret; 35178 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 16); 35179 return __ret; 35180 } 35181 #else 35182 __ai __attribute__((target("neon"))) uint8x8x2_t vzip_u8(uint8x8_t __p0, uint8x8_t __p1) { 35183 uint8x8x2_t __ret; 35184 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35185 uint8x8_t 
__rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35186 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 16); 35187 35188 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 35189 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 35190 return __ret; 35191 } 35192 #endif 35193 35194 #ifdef __LITTLE_ENDIAN__ 35195 __ai __attribute__((target("neon"))) uint32x2x2_t vzip_u32(uint32x2_t __p0, uint32x2_t __p1) { 35196 uint32x2x2_t __ret; 35197 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 18); 35198 return __ret; 35199 } 35200 #else 35201 __ai __attribute__((target("neon"))) uint32x2x2_t vzip_u32(uint32x2_t __p0, uint32x2_t __p1) { 35202 uint32x2x2_t __ret; 35203 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 35204 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 35205 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 18); 35206 35207 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 35208 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 35209 return __ret; 35210 } 35211 #endif 35212 35213 #ifdef __LITTLE_ENDIAN__ 35214 __ai __attribute__((target("neon"))) uint16x4x2_t vzip_u16(uint16x4_t __p0, uint16x4_t __p1) { 35215 uint16x4x2_t __ret; 35216 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 17); 35217 return __ret; 35218 } 35219 #else 35220 __ai __attribute__((target("neon"))) uint16x4x2_t vzip_u16(uint16x4_t __p0, uint16x4_t __p1) { 35221 uint16x4x2_t __ret; 35222 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35223 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35224 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 17); 35225 35226 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 35227 __ret.val[1] = 
__builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 35228 return __ret; 35229 } 35230 #endif 35231 35232 #ifdef __LITTLE_ENDIAN__ 35233 __ai __attribute__((target("neon"))) int8x8x2_t vzip_s8(int8x8_t __p0, int8x8_t __p1) { 35234 int8x8x2_t __ret; 35235 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 0); 35236 return __ret; 35237 } 35238 #else 35239 __ai __attribute__((target("neon"))) int8x8x2_t vzip_s8(int8x8_t __p0, int8x8_t __p1) { 35240 int8x8x2_t __ret; 35241 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35242 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35243 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 0); 35244 35245 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 35246 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 35247 return __ret; 35248 } 35249 #endif 35250 35251 #ifdef __LITTLE_ENDIAN__ 35252 __ai __attribute__((target("neon"))) float32x2x2_t vzip_f32(float32x2_t __p0, float32x2_t __p1) { 35253 float32x2x2_t __ret; 35254 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 9); 35255 return __ret; 35256 } 35257 #else 35258 __ai __attribute__((target("neon"))) float32x2x2_t vzip_f32(float32x2_t __p0, float32x2_t __p1) { 35259 float32x2x2_t __ret; 35260 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 35261 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 35262 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 9); 35263 35264 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 35265 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 35266 return __ret; 35267 } 35268 #endif 35269 35270 #ifdef __LITTLE_ENDIAN__ 35271 __ai __attribute__((target("neon"))) int32x2x2_t vzip_s32(int32x2_t __p0, int32x2_t __p1) { 35272 int32x2x2_t 
__ret; 35273 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 2); 35274 return __ret; 35275 } 35276 #else 35277 __ai __attribute__((target("neon"))) int32x2x2_t vzip_s32(int32x2_t __p0, int32x2_t __p1) { 35278 int32x2x2_t __ret; 35279 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 35280 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 35281 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 2); 35282 35283 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); 35284 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); 35285 return __ret; 35286 } 35287 #endif 35288 35289 #ifdef __LITTLE_ENDIAN__ 35290 __ai __attribute__((target("neon"))) int16x4x2_t vzip_s16(int16x4_t __p0, int16x4_t __p1) { 35291 int16x4x2_t __ret; 35292 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 1); 35293 return __ret; 35294 } 35295 #else 35296 __ai __attribute__((target("neon"))) int16x4x2_t vzip_s16(int16x4_t __p0, int16x4_t __p1) { 35297 int16x4x2_t __ret; 35298 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35299 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35300 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 1); 35301 35302 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 35303 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 35304 return __ret; 35305 } 35306 #endif 35307 35308 #ifdef __LITTLE_ENDIAN__ 35309 __ai __attribute__((target("neon"))) float16x8x2_t vzipq_f16(float16x8_t __p0, float16x8_t __p1) { 35310 float16x8x2_t __ret; 35311 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__p0, (int8x16_t)__p1, 40); 35312 return __ret; 35313 } 35314 #else 35315 __ai __attribute__((target("neon"))) float16x8x2_t vzipq_f16(float16x8_t __p0, float16x8_t __p1) { 35316 float16x8x2_t __ret; 35317 float16x8_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35318 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35319 __builtin_neon_vzipq_v(&__ret, (int8x16_t)__rev0, (int8x16_t)__rev1, 40); 35320 35321 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); 35322 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); 35323 return __ret; 35324 } 35325 #endif 35326 35327 #ifdef __LITTLE_ENDIAN__ 35328 __ai __attribute__((target("neon"))) float16x4x2_t vzip_f16(float16x4_t __p0, float16x4_t __p1) { 35329 float16x4x2_t __ret; 35330 __builtin_neon_vzip_v(&__ret, (int8x8_t)__p0, (int8x8_t)__p1, 8); 35331 return __ret; 35332 } 35333 #else 35334 __ai __attribute__((target("neon"))) float16x4x2_t vzip_f16(float16x4_t __p0, float16x4_t __p1) { 35335 float16x4x2_t __ret; 35336 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35337 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35338 __builtin_neon_vzip_v(&__ret, (int8x8_t)__rev0, (int8x8_t)__rev1, 8); 35339 35340 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); 35341 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); 35342 return __ret; 35343 } 35344 #endif 35345 35346 #ifdef __LITTLE_ENDIAN__ 35347 __ai __attribute__((target("v8.1a,neon"))) int32x4_t vqrdmlahq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 35348 int32x4_t __ret; 35349 __ret = (int32x4_t) __builtin_neon_vqrdmlahq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 35350 return __ret; 35351 } 35352 #else 35353 __ai __attribute__((target("v8.1a,neon"))) int32x4_t vqrdmlahq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 35354 int32x4_t __ret; 35355 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35356 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 
35357 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 35358 __ret = (int32x4_t) __builtin_neon_vqrdmlahq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34); 35359 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 35360 return __ret; 35361 } 35362 /* __noswap_vqrdmlahq_s32: exists only in the big-endian branch; issues the same builtin call as the little-endian body with no lane reversal. The big-endian vqrdmlahq_lane_s32 macro calls it on operands it has already reversed. */ __ai __attribute__((target("v8.1a,neon"))) int32x4_t __noswap_vqrdmlahq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 35363 int32x4_t __ret; 35364 __ret = (int32x4_t) __builtin_neon_vqrdmlahq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 35365 return __ret; 35366 } 35367 #endif 35368 35369 /* vqrdmlahq_s16 (target v8.1a,neon): int16x8_t form. Calls __builtin_neon_vqrdmlahq_s16 on the operands cast to int8x16_t with trailing constant 33; the big-endian build reverses all eight lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35370 __ai __attribute__((target("v8.1a,neon"))) int16x8_t vqrdmlahq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 35371 int16x8_t __ret; 35372 __ret = (int16x8_t) __builtin_neon_vqrdmlahq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33); 35373 return __ret; 35374 } 35375 #else 35376 __ai __attribute__((target("v8.1a,neon"))) int16x8_t vqrdmlahq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 35377 int16x8_t __ret; 35378 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35379 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35380 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 35381 __ret = (int16x8_t) __builtin_neon_vqrdmlahq_s16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33); 35382 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 35383 return __ret; 35384 } 35385 /* __noswap_vqrdmlahq_s16: big-endian-only variant without lane reversal; called by the big-endian vqrdmlahq_lane_s16 macro after that macro has reversed its operands. */ __ai __attribute__((target("v8.1a,neon"))) int16x8_t __noswap_vqrdmlahq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 35386 int16x8_t __ret; 35387 __ret = (int16x8_t) __builtin_neon_vqrdmlahq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33); 35388 return __ret; 35389 } 35390 #endif 35391 35392 /* vqrdmlah_s32 (target v8.1a,neon): 64-bit int32x2_t form. Calls __builtin_neon_vqrdmlah_s32 on the operands cast to int8x8_t with trailing constant 2; the big-endian build swaps the two lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35393 __ai __attribute__((target("v8.1a,neon"))) int32x2_t 
vqrdmlah_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 35394 int32x2_t __ret; 35395 __ret = (int32x2_t) __builtin_neon_vqrdmlah_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2); 35396 return __ret; 35397 } 35398 #else 35399 __ai __attribute__((target("v8.1a,neon"))) int32x2_t vqrdmlah_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 35400 int32x2_t __ret; 35401 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 35402 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 35403 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 35404 __ret = (int32x2_t) __builtin_neon_vqrdmlah_s32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2); 35405 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 35406 return __ret; 35407 } 35408 /* __noswap_vqrdmlah_s32: big-endian-only variant that calls the builtin without any lane reversal; the big-endian vqrdmlah_lane_s32 macro calls it on operands it has already reversed. */ __ai __attribute__((target("v8.1a,neon"))) int32x2_t __noswap_vqrdmlah_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 35409 int32x2_t __ret; 35410 __ret = (int32x2_t) __builtin_neon_vqrdmlah_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2); 35411 return __ret; 35412 } 35413 #endif 35414 35415 /* vqrdmlah_s16 (target v8.1a,neon): int16x4_t form. Calls __builtin_neon_vqrdmlah_s16 on the operands cast to int8x8_t with trailing constant 1; the big-endian build reverses the four lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35416 __ai __attribute__((target("v8.1a,neon"))) int16x4_t vqrdmlah_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 35417 int16x4_t __ret; 35418 __ret = (int16x4_t) __builtin_neon_vqrdmlah_s16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1); 35419 return __ret; 35420 } 35421 #else 35422 __ai __attribute__((target("v8.1a,neon"))) int16x4_t vqrdmlah_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 35423 int16x4_t __ret; 35424 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35425 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35426 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 35427 __ret = (int16x4_t) __builtin_neon_vqrdmlah_s16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 1); 35428 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 
0); 35429 return __ret; 35430 } 35431 /* __noswap_vqrdmlah_s16: big-endian-only variant that calls the builtin without any lane reversal; the big-endian vqrdmlah_lane_s16 macro calls it on operands it has already reversed. */ __ai __attribute__((target("v8.1a,neon"))) int16x4_t __noswap_vqrdmlah_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 35432 int16x4_t __ret; 35433 __ret = (int16x4_t) __builtin_neon_vqrdmlah_s16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1); 35434 return __ret; 35435 } 35436 #endif 35437 35438 /* vqrdmlahq_lane_s32(a, b, v, lane): statement-expression macro. Copies a and b into int32x4_t temporaries and v into an int32x2_t temporary (so each argument is evaluated once), then yields vqrdmlahq_s32(a, b, splatq_lane_s32(v, lane)). The big-endian version reverses the lanes of all three vectors, uses __noswap_vqrdmlahq_s32 and __noswap_splatq_lane_s32, and reverses the result. The numeric suffix on the local names keeps them distinct from the locals of other macros in this header. */ #ifdef __LITTLE_ENDIAN__ 35439 #define vqrdmlahq_lane_s32(__p0_134, __p1_134, __p2_134, __p3_134) __extension__ ({ \ 35440 int32x4_t __ret_134; \ 35441 int32x4_t __s0_134 = __p0_134; \ 35442 int32x4_t __s1_134 = __p1_134; \ 35443 int32x2_t __s2_134 = __p2_134; \ 35444 __ret_134 = vqrdmlahq_s32(__s0_134, __s1_134, splatq_lane_s32(__s2_134, __p3_134)); \ 35445 __ret_134; \ 35446 }) 35447 #else 35448 #define vqrdmlahq_lane_s32(__p0_135, __p1_135, __p2_135, __p3_135) __extension__ ({ \ 35449 int32x4_t __ret_135; \ 35450 int32x4_t __s0_135 = __p0_135; \ 35451 int32x4_t __s1_135 = __p1_135; \ 35452 int32x2_t __s2_135 = __p2_135; \ 35453 int32x4_t __rev0_135; __rev0_135 = __builtin_shufflevector(__s0_135, __s0_135, 3, 2, 1, 0); \ 35454 int32x4_t __rev1_135; __rev1_135 = __builtin_shufflevector(__s1_135, __s1_135, 3, 2, 1, 0); \ 35455 int32x2_t __rev2_135; __rev2_135 = __builtin_shufflevector(__s2_135, __s2_135, 1, 0); \ 35456 __ret_135 = __noswap_vqrdmlahq_s32(__rev0_135, __rev1_135, __noswap_splatq_lane_s32(__rev2_135, __p3_135)); \ 35457 __ret_135 = __builtin_shufflevector(__ret_135, __ret_135, 3, 2, 1, 0); \ 35458 __ret_135; \ 35459 }) 35460 #endif 35461 35462 /* vqrdmlahq_lane_s16(a, b, v, lane): int16 counterpart. a and b are int16x8_t, v is int16x4_t; yields vqrdmlahq_s16(a, b, splatq_lane_s16(v, lane)). The big-endian version reverses all three vectors, calls the __noswap_ helpers and reverses the eight-lane result. */ #ifdef __LITTLE_ENDIAN__ 35463 #define vqrdmlahq_lane_s16(__p0_136, __p1_136, __p2_136, __p3_136) __extension__ ({ \ 35464 int16x8_t __ret_136; \ 35465 int16x8_t __s0_136 = __p0_136; \ 35466 int16x8_t __s1_136 = __p1_136; \ 35467 int16x4_t __s2_136 = __p2_136; \ 35468 __ret_136 = vqrdmlahq_s16(__s0_136, __s1_136, splatq_lane_s16(__s2_136, __p3_136)); \ 35469 __ret_136; \ 35470 }) 35471 #else 35472 #define vqrdmlahq_lane_s16(__p0_137, __p1_137, __p2_137, __p3_137) 
__extension__ ({ \ 35473 int16x8_t __ret_137; \ 35474 int16x8_t __s0_137 = __p0_137; \ 35475 int16x8_t __s1_137 = __p1_137; \ 35476 int16x4_t __s2_137 = __p2_137; \ 35477 int16x8_t __rev0_137; __rev0_137 = __builtin_shufflevector(__s0_137, __s0_137, 7, 6, 5, 4, 3, 2, 1, 0); \ 35478 int16x8_t __rev1_137; __rev1_137 = __builtin_shufflevector(__s1_137, __s1_137, 7, 6, 5, 4, 3, 2, 1, 0); \ 35479 int16x4_t __rev2_137; __rev2_137 = __builtin_shufflevector(__s2_137, __s2_137, 3, 2, 1, 0); \ 35480 __ret_137 = __noswap_vqrdmlahq_s16(__rev0_137, __rev1_137, __noswap_splatq_lane_s16(__rev2_137, __p3_137)); \ 35481 __ret_137 = __builtin_shufflevector(__ret_137, __ret_137, 7, 6, 5, 4, 3, 2, 1, 0); \ 35482 __ret_137; \ 35483 }) 35484 #endif 35485 35486 /* vqrdmlah_lane_s32(a, b, v, lane): 64-bit form; all three vectors are int32x2_t. Copies the arguments into typed temporaries and yields vqrdmlah_s32(a, b, splat_lane_s32(v, lane)). The big-endian version swaps the two lanes of each vector, calls __noswap_vqrdmlah_s32 with __noswap_splat_lane_s32, and swaps the lanes of the result back. */ #ifdef __LITTLE_ENDIAN__ 35487 #define vqrdmlah_lane_s32(__p0_138, __p1_138, __p2_138, __p3_138) __extension__ ({ \ 35488 int32x2_t __ret_138; \ 35489 int32x2_t __s0_138 = __p0_138; \ 35490 int32x2_t __s1_138 = __p1_138; \ 35491 int32x2_t __s2_138 = __p2_138; \ 35492 __ret_138 = vqrdmlah_s32(__s0_138, __s1_138, splat_lane_s32(__s2_138, __p3_138)); \ 35493 __ret_138; \ 35494 }) 35495 #else 35496 #define vqrdmlah_lane_s32(__p0_139, __p1_139, __p2_139, __p3_139) __extension__ ({ \ 35497 int32x2_t __ret_139; \ 35498 int32x2_t __s0_139 = __p0_139; \ 35499 int32x2_t __s1_139 = __p1_139; \ 35500 int32x2_t __s2_139 = __p2_139; \ 35501 int32x2_t __rev0_139; __rev0_139 = __builtin_shufflevector(__s0_139, __s0_139, 1, 0); \ 35502 int32x2_t __rev1_139; __rev1_139 = __builtin_shufflevector(__s1_139, __s1_139, 1, 0); \ 35503 int32x2_t __rev2_139; __rev2_139 = __builtin_shufflevector(__s2_139, __s2_139, 1, 0); \ 35504 __ret_139 = __noswap_vqrdmlah_s32(__rev0_139, __rev1_139, __noswap_splat_lane_s32(__rev2_139, __p3_139)); \ 35505 __ret_139 = __builtin_shufflevector(__ret_139, __ret_139, 1, 0); \ 35506 __ret_139; \ 35507 }) 35508 #endif 35509 35510 /* vqrdmlah_lane_s16(a, b, v, lane): int16x4_t form; yields vqrdmlah_s16(a, b, splat_lane_s16(v, lane)) after copying the arguments into typed temporaries. The big-endian version reverses the four lanes of every vector, uses the __noswap_ helpers and reverses the result. */ #ifdef __LITTLE_ENDIAN__ 35511 #define vqrdmlah_lane_s16(__p0_140, __p1_140, __p2_140, __p3_140) 
__extension__ ({ \ 35512 int16x4_t __ret_140; \ 35513 int16x4_t __s0_140 = __p0_140; \ 35514 int16x4_t __s1_140 = __p1_140; \ 35515 int16x4_t __s2_140 = __p2_140; \ 35516 __ret_140 = vqrdmlah_s16(__s0_140, __s1_140, splat_lane_s16(__s2_140, __p3_140)); \ 35517 __ret_140; \ 35518 }) 35519 #else 35520 /* Big-endian vqrdmlah_lane_s16: reverses the four lanes of each of the three int16x4_t vectors, calls __noswap_vqrdmlah_s16 with __noswap_splat_lane_s16 applied to the reversed third vector, then reverses the result. */ #define vqrdmlah_lane_s16(__p0_141, __p1_141, __p2_141, __p3_141) __extension__ ({ \ 35521 int16x4_t __ret_141; \ 35522 int16x4_t __s0_141 = __p0_141; \ 35523 int16x4_t __s1_141 = __p1_141; \ 35524 int16x4_t __s2_141 = __p2_141; \ 35525 int16x4_t __rev0_141; __rev0_141 = __builtin_shufflevector(__s0_141, __s0_141, 3, 2, 1, 0); \ 35526 int16x4_t __rev1_141; __rev1_141 = __builtin_shufflevector(__s1_141, __s1_141, 3, 2, 1, 0); \ 35527 int16x4_t __rev2_141; __rev2_141 = __builtin_shufflevector(__s2_141, __s2_141, 3, 2, 1, 0); \ 35528 __ret_141 = __noswap_vqrdmlah_s16(__rev0_141, __rev1_141, __noswap_splat_lane_s16(__rev2_141, __p3_141)); \ 35529 __ret_141 = __builtin_shufflevector(__ret_141, __ret_141, 3, 2, 1, 0); \ 35530 __ret_141; \ 35531 }) 35532 #endif 35533 35534 /* vqrdmlshq_s32 (target v8.1a,neon): casts the three int32x4_t operands to int8x16_t, calls __builtin_neon_vqrdmlshq_s32 with trailing constant 34 and casts the result back to int32x4_t. The big-endian build reverses the lanes of every operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35535 __ai __attribute__((target("v8.1a,neon"))) int32x4_t vqrdmlshq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 35536 int32x4_t __ret; 35537 __ret = (int32x4_t) __builtin_neon_vqrdmlshq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 35538 return __ret; 35539 } 35540 #else 35541 __ai __attribute__((target("v8.1a,neon"))) int32x4_t vqrdmlshq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 35542 int32x4_t __ret; 35543 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35544 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35545 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 35546 __ret = (int32x4_t) __builtin_neon_vqrdmlshq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34); 35547 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 35548 return __ret; 35549 
} 35550 /* __noswap_vqrdmlshq_s32: big-endian-only variant that calls the builtin without any lane reversal; the big-endian vqrdmlshq_lane_s32 macro calls it on operands it has already reversed. */ __ai __attribute__((target("v8.1a,neon"))) int32x4_t __noswap_vqrdmlshq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 35551 int32x4_t __ret; 35552 __ret = (int32x4_t) __builtin_neon_vqrdmlshq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 35553 return __ret; 35554 } 35555 #endif 35556 35557 /* vqrdmlshq_s16 (target v8.1a,neon): int16x8_t form. Calls __builtin_neon_vqrdmlshq_s16 on the operands cast to int8x16_t with trailing constant 33; the big-endian build reverses all eight lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35558 __ai __attribute__((target("v8.1a,neon"))) int16x8_t vqrdmlshq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 35559 int16x8_t __ret; 35560 __ret = (int16x8_t) __builtin_neon_vqrdmlshq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33); 35561 return __ret; 35562 } 35563 #else 35564 __ai __attribute__((target("v8.1a,neon"))) int16x8_t vqrdmlshq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 35565 int16x8_t __ret; 35566 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35567 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35568 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 35569 __ret = (int16x8_t) __builtin_neon_vqrdmlshq_s16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33); 35570 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 35571 return __ret; 35572 } 35573 /* __noswap_vqrdmlshq_s16: big-endian-only variant without lane reversal; called by the big-endian vqrdmlshq_lane_s16 macro after that macro has reversed its operands. */ __ai __attribute__((target("v8.1a,neon"))) int16x8_t __noswap_vqrdmlshq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 35574 int16x8_t __ret; 35575 __ret = (int16x8_t) __builtin_neon_vqrdmlshq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33); 35576 return __ret; 35577 } 35578 #endif 35579 35580 /* vqrdmlsh_s32 (target v8.1a,neon): 64-bit int32x2_t form. Calls __builtin_neon_vqrdmlsh_s32 on the operands cast to int8x8_t with trailing constant 2; the big-endian build swaps the two lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35581 __ai __attribute__((target("v8.1a,neon"))) int32x2_t vqrdmlsh_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 35582 int32x2_t __ret; 35583 __ret = (int32x2_t) __builtin_neon_vqrdmlsh_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2); 35584 return __ret; 35585 } 35586 #else 35587 __ai __attribute__((target("v8.1a,neon"))) int32x2_t 
vqrdmlsh_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 35588 int32x2_t __ret; 35589 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 35590 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 35591 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 35592 __ret = (int32x2_t) __builtin_neon_vqrdmlsh_s32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 2); 35593 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 35594 return __ret; 35595 } 35596 /* __noswap_vqrdmlsh_s32: big-endian-only variant that calls the builtin without any lane reversal; the big-endian vqrdmlsh_lane_s32 macro calls it on operands it has already reversed. */ __ai __attribute__((target("v8.1a,neon"))) int32x2_t __noswap_vqrdmlsh_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 35597 int32x2_t __ret; 35598 __ret = (int32x2_t) __builtin_neon_vqrdmlsh_s32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 2); 35599 return __ret; 35600 } 35601 #endif 35602 35603 /* vqrdmlsh_s16 (target v8.1a,neon): int16x4_t form. Calls __builtin_neon_vqrdmlsh_s16 on the operands cast to int8x8_t with trailing constant 1; the big-endian build reverses the four lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35604 __ai __attribute__((target("v8.1a,neon"))) int16x4_t vqrdmlsh_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 35605 int16x4_t __ret; 35606 __ret = (int16x4_t) __builtin_neon_vqrdmlsh_s16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1); 35607 return __ret; 35608 } 35609 #else 35610 __ai __attribute__((target("v8.1a,neon"))) int16x4_t vqrdmlsh_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 35611 int16x4_t __ret; 35612 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35613 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35614 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 35615 __ret = (int16x4_t) __builtin_neon_vqrdmlsh_s16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 1); 35616 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 35617 return __ret; 35618 } 35619 /* __noswap_vqrdmlsh_s16: big-endian-only variant that calls the builtin without any lane reversal; the big-endian vqrdmlsh_lane_s16 macro calls it on operands it has already reversed. */ __ai __attribute__((target("v8.1a,neon"))) int16x4_t __noswap_vqrdmlsh_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 35620 int16x4_t __ret; 35621 __ret = (int16x4_t) __builtin_neon_vqrdmlsh_s16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 1); 
35622 return __ret; 35623 } 35624 #endif 35625 35626 /* vqrdmlshq_lane_s32(a, b, v, lane): statement-expression macro. Copies a and b into int32x4_t temporaries and v into an int32x2_t temporary (so each argument is evaluated once), then yields vqrdmlshq_s32(a, b, splatq_lane_s32(v, lane)). The big-endian version reverses the lanes of all three vectors, uses __noswap_vqrdmlshq_s32 and __noswap_splatq_lane_s32, and reverses the result. */ #ifdef __LITTLE_ENDIAN__ 35627 #define vqrdmlshq_lane_s32(__p0_142, __p1_142, __p2_142, __p3_142) __extension__ ({ \ 35628 int32x4_t __ret_142; \ 35629 int32x4_t __s0_142 = __p0_142; \ 35630 int32x4_t __s1_142 = __p1_142; \ 35631 int32x2_t __s2_142 = __p2_142; \ 35632 __ret_142 = vqrdmlshq_s32(__s0_142, __s1_142, splatq_lane_s32(__s2_142, __p3_142)); \ 35633 __ret_142; \ 35634 }) 35635 #else 35636 #define vqrdmlshq_lane_s32(__p0_143, __p1_143, __p2_143, __p3_143) __extension__ ({ \ 35637 int32x4_t __ret_143; \ 35638 int32x4_t __s0_143 = __p0_143; \ 35639 int32x4_t __s1_143 = __p1_143; \ 35640 int32x2_t __s2_143 = __p2_143; \ 35641 int32x4_t __rev0_143; __rev0_143 = __builtin_shufflevector(__s0_143, __s0_143, 3, 2, 1, 0); \ 35642 int32x4_t __rev1_143; __rev1_143 = __builtin_shufflevector(__s1_143, __s1_143, 3, 2, 1, 0); \ 35643 int32x2_t __rev2_143; __rev2_143 = __builtin_shufflevector(__s2_143, __s2_143, 1, 0); \ 35644 __ret_143 = __noswap_vqrdmlshq_s32(__rev0_143, __rev1_143, __noswap_splatq_lane_s32(__rev2_143, __p3_143)); \ 35645 __ret_143 = __builtin_shufflevector(__ret_143, __ret_143, 3, 2, 1, 0); \ 35646 __ret_143; \ 35647 }) 35648 #endif 35649 35650 /* vqrdmlshq_lane_s16(a, b, v, lane): int16 counterpart. a and b are int16x8_t, v is int16x4_t; yields vqrdmlshq_s16(a, b, splatq_lane_s16(v, lane)). The big-endian version reverses all three vectors, calls the __noswap_ helpers and reverses the eight-lane result. */ #ifdef __LITTLE_ENDIAN__ 35651 #define vqrdmlshq_lane_s16(__p0_144, __p1_144, __p2_144, __p3_144) __extension__ ({ \ 35652 int16x8_t __ret_144; \ 35653 int16x8_t __s0_144 = __p0_144; \ 35654 int16x8_t __s1_144 = __p1_144; \ 35655 int16x4_t __s2_144 = __p2_144; \ 35656 __ret_144 = vqrdmlshq_s16(__s0_144, __s1_144, splatq_lane_s16(__s2_144, __p3_144)); \ 35657 __ret_144; \ 35658 }) 35659 #else 35660 #define vqrdmlshq_lane_s16(__p0_145, __p1_145, __p2_145, __p3_145) __extension__ ({ \ 35661 int16x8_t __ret_145; \ 35662 int16x8_t __s0_145 = __p0_145; \ 35663 int16x8_t __s1_145 = __p1_145; \ 35664 int16x4_t __s2_145 = __p2_145; \ 35665 int16x8_t __rev0_145; __rev0_145 = __builtin_shufflevector(__s0_145, __s0_145, 7, 6, 5, 4, 3, 2, 1, 0); \ 35666 int16x8_t 
__rev1_145; __rev1_145 = __builtin_shufflevector(__s1_145, __s1_145, 7, 6, 5, 4, 3, 2, 1, 0); \ 35667 int16x4_t __rev2_145; __rev2_145 = __builtin_shufflevector(__s2_145, __s2_145, 3, 2, 1, 0); \ 35668 __ret_145 = __noswap_vqrdmlshq_s16(__rev0_145, __rev1_145, __noswap_splatq_lane_s16(__rev2_145, __p3_145)); \ 35669 __ret_145 = __builtin_shufflevector(__ret_145, __ret_145, 7, 6, 5, 4, 3, 2, 1, 0); \ 35670 __ret_145; \ 35671 }) 35672 #endif 35673 35674 /* vqrdmlsh_lane_s32(a, b, v, lane): 64-bit form; all three vectors are int32x2_t. Copies the arguments into typed temporaries and yields vqrdmlsh_s32(a, b, splat_lane_s32(v, lane)). The big-endian version swaps the two lanes of each vector, calls __noswap_vqrdmlsh_s32 with __noswap_splat_lane_s32, and swaps the lanes of the result back. */ #ifdef __LITTLE_ENDIAN__ 35675 #define vqrdmlsh_lane_s32(__p0_146, __p1_146, __p2_146, __p3_146) __extension__ ({ \ 35676 int32x2_t __ret_146; \ 35677 int32x2_t __s0_146 = __p0_146; \ 35678 int32x2_t __s1_146 = __p1_146; \ 35679 int32x2_t __s2_146 = __p2_146; \ 35680 __ret_146 = vqrdmlsh_s32(__s0_146, __s1_146, splat_lane_s32(__s2_146, __p3_146)); \ 35681 __ret_146; \ 35682 }) 35683 #else 35684 #define vqrdmlsh_lane_s32(__p0_147, __p1_147, __p2_147, __p3_147) __extension__ ({ \ 35685 int32x2_t __ret_147; \ 35686 int32x2_t __s0_147 = __p0_147; \ 35687 int32x2_t __s1_147 = __p1_147; \ 35688 int32x2_t __s2_147 = __p2_147; \ 35689 int32x2_t __rev0_147; __rev0_147 = __builtin_shufflevector(__s0_147, __s0_147, 1, 0); \ 35690 int32x2_t __rev1_147; __rev1_147 = __builtin_shufflevector(__s1_147, __s1_147, 1, 0); \ 35691 int32x2_t __rev2_147; __rev2_147 = __builtin_shufflevector(__s2_147, __s2_147, 1, 0); \ 35692 __ret_147 = __noswap_vqrdmlsh_s32(__rev0_147, __rev1_147, __noswap_splat_lane_s32(__rev2_147, __p3_147)); \ 35693 __ret_147 = __builtin_shufflevector(__ret_147, __ret_147, 1, 0); \ 35694 __ret_147; \ 35695 }) 35696 #endif 35697 35698 /* vqrdmlsh_lane_s16(a, b, v, lane), little-endian definition: copies the three int16x4_t arguments into typed temporaries and yields vqrdmlsh_s16(a, b, splat_lane_s16(v, lane)). The big-endian definition follows the #else. */ #ifdef __LITTLE_ENDIAN__ 35699 #define vqrdmlsh_lane_s16(__p0_148, __p1_148, __p2_148, __p3_148) __extension__ ({ \ 35700 int16x4_t __ret_148; \ 35701 int16x4_t __s0_148 = __p0_148; \ 35702 int16x4_t __s1_148 = __p1_148; \ 35703 int16x4_t __s2_148 = __p2_148; \ 35704 __ret_148 = vqrdmlsh_s16(__s0_148, __s1_148, splat_lane_s16(__s2_148, __p3_148)); \ 35705 __ret_148; \ 35706 }) 35707 #else 
35708 /* Big-endian vqrdmlsh_lane_s16: reverses the four lanes of each of the three int16x4_t vectors, calls __noswap_vqrdmlsh_s16 with __noswap_splat_lane_s16 applied to the reversed third vector, then reverses the result. */ #define vqrdmlsh_lane_s16(__p0_149, __p1_149, __p2_149, __p3_149) __extension__ ({ \ 35709 int16x4_t __ret_149; \ 35710 int16x4_t __s0_149 = __p0_149; \ 35711 int16x4_t __s1_149 = __p1_149; \ 35712 int16x4_t __s2_149 = __p2_149; \ 35713 int16x4_t __rev0_149; __rev0_149 = __builtin_shufflevector(__s0_149, __s0_149, 3, 2, 1, 0); \ 35714 int16x4_t __rev1_149; __rev1_149 = __builtin_shufflevector(__s1_149, __s1_149, 3, 2, 1, 0); \ 35715 int16x4_t __rev2_149; __rev2_149 = __builtin_shufflevector(__s2_149, __s2_149, 3, 2, 1, 0); \ 35716 __ret_149 = __noswap_vqrdmlsh_s16(__rev0_149, __rev1_149, __noswap_splat_lane_s16(__rev2_149, __p3_149)); \ 35717 __ret_149 = __builtin_shufflevector(__ret_149, __ret_149, 3, 2, 1, 0); \ 35718 __ret_149; \ 35719 }) 35720 #endif 35721 35722 /* vcadd_rot270_f16 (target v8.3a,fullfp16,neon): casts both float16x4_t operands to int8x8_t, calls __builtin_neon_vcadd_rot270_f16 with trailing constant 8 and casts the result back. The big-endian build reverses the four lanes of each operand before the call and of the result after it. NOTE(review): presumably the complex add with 270 degree rotation described by ACLE - confirm against the ACLE reference. */ #ifdef __LITTLE_ENDIAN__ 35723 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcadd_rot270_f16(float16x4_t __p0, float16x4_t __p1) { 35724 float16x4_t __ret; 35725 __ret = (float16x4_t) __builtin_neon_vcadd_rot270_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 35726 return __ret; 35727 } 35728 #else 35729 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcadd_rot270_f16(float16x4_t __p0, float16x4_t __p1) { 35730 float16x4_t __ret; 35731 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35732 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35733 __ret = (float16x4_t) __builtin_neon_vcadd_rot270_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 35734 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 35735 return __ret; 35736 } 35737 #endif 35738 35739 /* vcadd_rot90_f16 (target v8.3a,fullfp16,neon): same wrapper shape as vcadd_rot270_f16 but around __builtin_neon_vcadd_rot90_f16; the big-endian build reverses operand lanes before the call and result lanes after it. */ #ifdef __LITTLE_ENDIAN__ 35740 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcadd_rot90_f16(float16x4_t __p0, float16x4_t __p1) { 35741 float16x4_t __ret; 35742 __ret = (float16x4_t) __builtin_neon_vcadd_rot90_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 35743 return __ret; 35744 } 35745 #else 35746 __ai __attribute__((target("v8.3a,fullfp16,neon"))) 
float16x4_t vcadd_rot90_f16(float16x4_t __p0, float16x4_t __p1) { 35747 float16x4_t __ret; 35748 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35749 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35750 __ret = (float16x4_t) __builtin_neon_vcadd_rot90_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 35751 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 35752 return __ret; 35753 } 35754 #endif 35755 35756 /* vcaddq_rot270_f16 (target v8.3a,fullfp16,neon): 128-bit form. Casts both float16x8_t operands to int8x16_t, calls __builtin_neon_vcaddq_rot270_f16 with trailing constant 40 and casts the result back. The big-endian build reverses all eight lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35757 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcaddq_rot270_f16(float16x8_t __p0, float16x8_t __p1) { 35758 float16x8_t __ret; 35759 __ret = (float16x8_t) __builtin_neon_vcaddq_rot270_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 35760 return __ret; 35761 } 35762 #else 35763 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcaddq_rot270_f16(float16x8_t __p0, float16x8_t __p1) { 35764 float16x8_t __ret; 35765 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35766 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35767 __ret = (float16x8_t) __builtin_neon_vcaddq_rot270_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 35768 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 35769 return __ret; 35770 } 35771 #endif 35772 35773 /* vcaddq_rot90_f16 (target v8.3a,fullfp16,neon): same wrapper shape as vcaddq_rot270_f16 but around __builtin_neon_vcaddq_rot90_f16; the big-endian build reverses operand lanes before the call and result lanes after it. */ #ifdef __LITTLE_ENDIAN__ 35774 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcaddq_rot90_f16(float16x8_t __p0, float16x8_t __p1) { 35775 float16x8_t __ret; 35776 __ret = (float16x8_t) __builtin_neon_vcaddq_rot90_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 35777 return __ret; 35778 } 35779 #else 35780 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcaddq_rot90_f16(float16x8_t __p0, float16x8_t __p1) { 35781 float16x8_t __ret; 35782 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35783 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 
7, 6, 5, 4, 3, 2, 1, 0); 35784 __ret = (float16x8_t) __builtin_neon_vcaddq_rot90_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 35785 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 35786 return __ret; 35787 } 35788 #endif 35789 35790 /* vcmlaq_f16 (target v8.3a,fullfp16,neon): casts the three float16x8_t operands to int8x16_t, calls __builtin_neon_vcmlaq_f16 with trailing constant 40 and casts the result back. The big-endian build reverses all eight lanes of each operand before the call and of the result after it. NOTE(review): presumably the complex multiply-accumulate described by ACLE - confirm against the ACLE reference. */ #ifdef __LITTLE_ENDIAN__ 35791 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 35792 float16x8_t __ret; 35793 __ret = (float16x8_t) __builtin_neon_vcmlaq_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 35794 return __ret; 35795 } 35796 #else 35797 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 35798 float16x8_t __ret; 35799 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35800 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35801 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 35802 __ret = (float16x8_t) __builtin_neon_vcmlaq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40); 35803 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 35804 return __ret; 35805 } 35806 /* __noswap_vcmlaq_f16: big-endian-only variant that calls the builtin without any lane reversal; the big-endian vcmlaq_lane_f16 and vcmlaq_laneq_f16 macros call it on operands they have already reversed. */ __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t __noswap_vcmlaq_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 35807 float16x8_t __ret; 35808 __ret = (float16x8_t) __builtin_neon_vcmlaq_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 35809 return __ret; 35810 } 35811 #endif 35812 35813 /* vcmla_f16 (target v8.3a,fullfp16,neon): 64-bit float16x4_t form. Calls __builtin_neon_vcmla_f16 on the operands cast to int8x8_t with trailing constant 8; the big-endian build reverses the four lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35814 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 35815 float16x4_t __ret; 35816 __ret = (float16x4_t) __builtin_neon_vcmla_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 35817 return __ret; 35818 } 35819 #else 35820 __ai __attribute__((target("v8.3a,fullfp16,neon"))) 
float16x4_t vcmla_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 35821 float16x4_t __ret; 35822 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35823 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35824 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 35825 __ret = (float16x4_t) __builtin_neon_vcmla_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8); 35826 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 35827 return __ret; 35828 } 35829 /* __noswap_vcmla_f16: big-endian-only variant that calls the builtin without any lane reversal; the big-endian vcmla_lane_f16 and vcmla_laneq_f16 macros call it on operands they have already reversed. */ __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t __noswap_vcmla_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 35830 float16x4_t __ret; 35831 __ret = (float16x4_t) __builtin_neon_vcmla_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 35832 return __ret; 35833 } 35834 #endif 35835 35836 /* vcmla_lane_f16(a, b, v, lane): statement-expression macro over three float16x4_t vectors. It bit-casts v to uint32x2_t, reads 32-bit lane number lane with vget_lane_u32 (one 32-bit lane covers two adjacent float16 elements), builds a uint32x2_t holding that value in both lanes, bit-casts it back to float16x4_t and passes it as the third operand of vcmla_f16. The big-endian version reverses the float16 lanes of all three vectors first, uses __noswap_vget_lane_u32 and __noswap_vcmla_f16, and reverses the result. */ #ifdef __LITTLE_ENDIAN__ 35837 #define vcmla_lane_f16(__p0_150, __p1_150, __p2_150, __p3_150) __extension__ ({ \ 35838 float16x4_t __ret_150; \ 35839 float16x4_t __s0_150 = __p0_150; \ 35840 float16x4_t __s1_150 = __p1_150; \ 35841 float16x4_t __s2_150 = __p2_150; \ 35842 __ret_150 = vcmla_f16(__s0_150, __s1_150, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_150), __p3_150), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_150), __p3_150)})); \ 35843 __ret_150; \ 35844 }) 35845 #else 35846 #define vcmla_lane_f16(__p0_151, __p1_151, __p2_151, __p3_151) __extension__ ({ \ 35847 float16x4_t __ret_151; \ 35848 float16x4_t __s0_151 = __p0_151; \ 35849 float16x4_t __s1_151 = __p1_151; \ 35850 float16x4_t __s2_151 = __p2_151; \ 35851 float16x4_t __rev0_151; __rev0_151 = __builtin_shufflevector(__s0_151, __s0_151, 3, 2, 1, 0); \ 35852 float16x4_t __rev1_151; __rev1_151 = __builtin_shufflevector(__s1_151, __s1_151, 3, 2, 1, 0); \ 35853 float16x4_t __rev2_151; __rev2_151 = __builtin_shufflevector(__s2_151, __s2_151, 3, 2, 1, 0); \ 35854 __ret_151 = 
__noswap_vcmla_f16(__rev0_151, __rev1_151, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_151), __p3_151), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_151), __p3_151)})); \ 35855 __ret_151 = __builtin_shufflevector(__ret_151, __ret_151, 3, 2, 1, 0); \ 35856 __ret_151; \ 35857 }) 35858 #endif 35859 35860 /* vcmlaq_lane_f16(a, b, v, lane): a and b are float16x8_t, v is float16x4_t. It bit-casts v to uint32x2_t, reads 32-bit lane number lane with vget_lane_u32, builds a uint32x4_t holding that value in all four lanes, bit-casts it to float16x8_t and passes it as the third operand of vcmlaq_f16. The big-endian version reverses the float16 lanes of all three vectors first, uses __noswap_vget_lane_u32 and __noswap_vcmlaq_f16, and reverses the eight-lane result. */ #ifdef __LITTLE_ENDIAN__ 35861 #define vcmlaq_lane_f16(__p0_152, __p1_152, __p2_152, __p3_152) __extension__ ({ \ 35862 float16x8_t __ret_152; \ 35863 float16x8_t __s0_152 = __p0_152; \ 35864 float16x8_t __s1_152 = __p1_152; \ 35865 float16x4_t __s2_152 = __p2_152; \ 35866 __ret_152 = vcmlaq_f16(__s0_152, __s1_152, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_152), __p3_152), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_152), __p3_152), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_152), __p3_152), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_152), __p3_152)})); \ 35867 __ret_152; \ 35868 }) 35869 #else 35870 #define vcmlaq_lane_f16(__p0_153, __p1_153, __p2_153, __p3_153) __extension__ ({ \ 35871 float16x8_t __ret_153; \ 35872 float16x8_t __s0_153 = __p0_153; \ 35873 float16x8_t __s1_153 = __p1_153; \ 35874 float16x4_t __s2_153 = __p2_153; \ 35875 float16x8_t __rev0_153; __rev0_153 = __builtin_shufflevector(__s0_153, __s0_153, 7, 6, 5, 4, 3, 2, 1, 0); \ 35876 float16x8_t __rev1_153; __rev1_153 = __builtin_shufflevector(__s1_153, __s1_153, 7, 6, 5, 4, 3, 2, 1, 0); \ 35877 float16x4_t __rev2_153; __rev2_153 = __builtin_shufflevector(__s2_153, __s2_153, 3, 2, 1, 0); \ 35878 __ret_153 = __noswap_vcmlaq_f16(__rev0_153, __rev1_153, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_153), __p3_153), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_153), __p3_153), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_153), __p3_153), 
__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_153), __p3_153)})); \ 35879 __ret_153 = __builtin_shufflevector(__ret_153, __ret_153, 7, 6, 5, 4, 3, 2, 1, 0); \ 35880 __ret_153; \ 35881 }) 35882 #endif 35883 35884 /* vcmla_laneq_f16(a, b, v, lane): a and b are float16x4_t, v is float16x8_t. It bit-casts v to uint32x4_t, reads 32-bit lane number lane with vgetq_lane_u32, builds a uint32x2_t holding that value in both lanes, bit-casts it to float16x4_t and passes it as the third operand of vcmla_f16. The big-endian version reverses the float16 lanes of all three vectors first, uses __noswap_vgetq_lane_u32 and __noswap_vcmla_f16, and reverses the four-lane result. */ #ifdef __LITTLE_ENDIAN__ 35885 #define vcmla_laneq_f16(__p0_154, __p1_154, __p2_154, __p3_154) __extension__ ({ \ 35886 float16x4_t __ret_154; \ 35887 float16x4_t __s0_154 = __p0_154; \ 35888 float16x4_t __s1_154 = __p1_154; \ 35889 float16x8_t __s2_154 = __p2_154; \ 35890 __ret_154 = vcmla_f16(__s0_154, __s1_154, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_154), __p3_154), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_154), __p3_154)})); \ 35891 __ret_154; \ 35892 }) 35893 #else 35894 #define vcmla_laneq_f16(__p0_155, __p1_155, __p2_155, __p3_155) __extension__ ({ \ 35895 float16x4_t __ret_155; \ 35896 float16x4_t __s0_155 = __p0_155; \ 35897 float16x4_t __s1_155 = __p1_155; \ 35898 float16x8_t __s2_155 = __p2_155; \ 35899 float16x4_t __rev0_155; __rev0_155 = __builtin_shufflevector(__s0_155, __s0_155, 3, 2, 1, 0); \ 35900 float16x4_t __rev1_155; __rev1_155 = __builtin_shufflevector(__s1_155, __s1_155, 3, 2, 1, 0); \ 35901 float16x8_t __rev2_155; __rev2_155 = __builtin_shufflevector(__s2_155, __s2_155, 7, 6, 5, 4, 3, 2, 1, 0); \ 35902 __ret_155 = __noswap_vcmla_f16(__rev0_155, __rev1_155, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_155), __p3_155), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_155), __p3_155)})); \ 35903 __ret_155 = __builtin_shufflevector(__ret_155, __ret_155, 3, 2, 1, 0); \ 35904 __ret_155; \ 35905 }) 35906 #endif 35907 35908 /* vcmlaq_laneq_f16(a, b, v, lane): all three vectors are float16x8_t. It bit-casts v to uint32x4_t, reads 32-bit lane number lane with vgetq_lane_u32, builds a uint32x4_t holding that value in all four lanes, bit-casts it to float16x8_t and passes it as the third operand of vcmlaq_f16. The big-endian definition follows the #else. */ #ifdef __LITTLE_ENDIAN__ 35909 #define vcmlaq_laneq_f16(__p0_156, __p1_156, __p2_156, __p3_156) __extension__ ({ \ 35910 float16x8_t __ret_156; \ 35911 float16x8_t __s0_156 = __p0_156; \ 35912 float16x8_t __s1_156 = __p1_156; \ 35913 float16x8_t __s2_156 = __p2_156; 
\ 35914 __ret_156 = vcmlaq_f16(__s0_156, __s1_156, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_156), __p3_156), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_156), __p3_156), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_156), __p3_156), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_156), __p3_156)})); \ 35915 __ret_156; \ 35916 }) 35917 #else 35918 /* Big-endian vcmlaq_laneq_f16: reverses the eight float16 lanes of all three vectors, builds the replicated 32-bit operand with __noswap_vgetq_lane_u32 on the reversed third vector, calls __noswap_vcmlaq_f16 and reverses the result. */ #define vcmlaq_laneq_f16(__p0_157, __p1_157, __p2_157, __p3_157) __extension__ ({ \ 35919 float16x8_t __ret_157; \ 35920 float16x8_t __s0_157 = __p0_157; \ 35921 float16x8_t __s1_157 = __p1_157; \ 35922 float16x8_t __s2_157 = __p2_157; \ 35923 float16x8_t __rev0_157; __rev0_157 = __builtin_shufflevector(__s0_157, __s0_157, 7, 6, 5, 4, 3, 2, 1, 0); \ 35924 float16x8_t __rev1_157; __rev1_157 = __builtin_shufflevector(__s1_157, __s1_157, 7, 6, 5, 4, 3, 2, 1, 0); \ 35925 float16x8_t __rev2_157; __rev2_157 = __builtin_shufflevector(__s2_157, __s2_157, 7, 6, 5, 4, 3, 2, 1, 0); \ 35926 __ret_157 = __noswap_vcmlaq_f16(__rev0_157, __rev1_157, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_157), __p3_157), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_157), __p3_157), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_157), __p3_157), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_157), __p3_157)})); \ 35927 __ret_157 = __builtin_shufflevector(__ret_157, __ret_157, 7, 6, 5, 4, 3, 2, 1, 0); \ 35928 __ret_157; \ 35929 }) 35930 #endif 35931 35932 /* vcmlaq_rot180_f16 (target v8.3a,fullfp16,neon): casts the three float16x8_t operands to int8x16_t, calls __builtin_neon_vcmlaq_rot180_f16 with trailing constant 40 and casts the result back. The big-endian build reverses all eight lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35933 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot180_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 35934 float16x8_t __ret; 35935 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot180_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 35936 return __ret; 35937 } 35938 #else 35939 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t 
vcmlaq_rot180_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 35940 float16x8_t __ret; 35941 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 35942 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 35943 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 35944 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot180_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40); 35945 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 35946 return __ret; 35947 } 35948 /* __noswap_vcmlaq_rot180_f16: defined only in the big-endian branch; issues the same builtin call as the little-endian body with no lane reversal. */ __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t __noswap_vcmlaq_rot180_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 35949 float16x8_t __ret; 35950 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot180_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 35951 return __ret; 35952 } 35953 #endif 35954 35955 /* vcmla_rot180_f16 (target v8.3a,fullfp16,neon): 64-bit float16x4_t form. Calls __builtin_neon_vcmla_rot180_f16 on the operands cast to int8x8_t with trailing constant 8; the big-endian build reverses the four lanes of each operand before the call and of the result after it. */ #ifdef __LITTLE_ENDIAN__ 35956 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot180_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 35957 float16x4_t __ret; 35958 __ret = (float16x4_t) __builtin_neon_vcmla_rot180_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 35959 return __ret; 35960 } 35961 #else 35962 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot180_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 35963 float16x4_t __ret; 35964 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 35965 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 35966 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 35967 __ret = (float16x4_t) __builtin_neon_vcmla_rot180_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8); 35968 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 35969 return __ret; 35970 } 35971 /* __noswap_vcmla_rot180_f16: big-endian-only variant that calls the builtin without any lane reversal; the big-endian vcmla_rot180_lane_f16 macro calls it on operands it has already reversed. */ __ai __attribute__((target("v8.3a,fullfp16,neon"))) 
float16x4_t __noswap_vcmla_rot180_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 35972 float16x4_t __ret; 35973 __ret = (float16x4_t) __builtin_neon_vcmla_rot180_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 35974 return __ret; 35975 } 35976 #endif 35977 35978 #ifdef __LITTLE_ENDIAN__ 35979 #define vcmla_rot180_lane_f16(__p0_158, __p1_158, __p2_158, __p3_158) __extension__ ({ \ 35980 float16x4_t __ret_158; \ 35981 float16x4_t __s0_158 = __p0_158; \ 35982 float16x4_t __s1_158 = __p1_158; \ 35983 float16x4_t __s2_158 = __p2_158; \ 35984 __ret_158 = vcmla_rot180_f16(__s0_158, __s1_158, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_158), __p3_158), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_158), __p3_158)})); \ 35985 __ret_158; \ 35986 }) 35987 #else 35988 #define vcmla_rot180_lane_f16(__p0_159, __p1_159, __p2_159, __p3_159) __extension__ ({ \ 35989 float16x4_t __ret_159; \ 35990 float16x4_t __s0_159 = __p0_159; \ 35991 float16x4_t __s1_159 = __p1_159; \ 35992 float16x4_t __s2_159 = __p2_159; \ 35993 float16x4_t __rev0_159; __rev0_159 = __builtin_shufflevector(__s0_159, __s0_159, 3, 2, 1, 0); \ 35994 float16x4_t __rev1_159; __rev1_159 = __builtin_shufflevector(__s1_159, __s1_159, 3, 2, 1, 0); \ 35995 float16x4_t __rev2_159; __rev2_159 = __builtin_shufflevector(__s2_159, __s2_159, 3, 2, 1, 0); \ 35996 __ret_159 = __noswap_vcmla_rot180_f16(__rev0_159, __rev1_159, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_159), __p3_159), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_159), __p3_159)})); \ 35997 __ret_159 = __builtin_shufflevector(__ret_159, __ret_159, 3, 2, 1, 0); \ 35998 __ret_159; \ 35999 }) 36000 #endif 36001 36002 #ifdef __LITTLE_ENDIAN__ 36003 #define vcmlaq_rot180_lane_f16(__p0_160, __p1_160, __p2_160, __p3_160) __extension__ ({ \ 36004 float16x8_t __ret_160; \ 36005 float16x8_t __s0_160 = __p0_160; \ 36006 
float16x8_t __s1_160 = __p1_160; \ 36007 float16x4_t __s2_160 = __p2_160; \ 36008 __ret_160 = vcmlaq_rot180_f16(__s0_160, __s1_160, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_160), __p3_160), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_160), __p3_160), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_160), __p3_160), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_160), __p3_160)})); \ 36009 __ret_160; \ 36010 }) 36011 #else 36012 #define vcmlaq_rot180_lane_f16(__p0_161, __p1_161, __p2_161, __p3_161) __extension__ ({ \ 36013 float16x8_t __ret_161; \ 36014 float16x8_t __s0_161 = __p0_161; \ 36015 float16x8_t __s1_161 = __p1_161; \ 36016 float16x4_t __s2_161 = __p2_161; \ 36017 float16x8_t __rev0_161; __rev0_161 = __builtin_shufflevector(__s0_161, __s0_161, 7, 6, 5, 4, 3, 2, 1, 0); \ 36018 float16x8_t __rev1_161; __rev1_161 = __builtin_shufflevector(__s1_161, __s1_161, 7, 6, 5, 4, 3, 2, 1, 0); \ 36019 float16x4_t __rev2_161; __rev2_161 = __builtin_shufflevector(__s2_161, __s2_161, 3, 2, 1, 0); \ 36020 __ret_161 = __noswap_vcmlaq_rot180_f16(__rev0_161, __rev1_161, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_161), __p3_161), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_161), __p3_161), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_161), __p3_161), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_161), __p3_161)})); \ 36021 __ret_161 = __builtin_shufflevector(__ret_161, __ret_161, 7, 6, 5, 4, 3, 2, 1, 0); \ 36022 __ret_161; \ 36023 }) 36024 #endif 36025 36026 #ifdef __LITTLE_ENDIAN__ 36027 #define vcmla_rot180_laneq_f16(__p0_162, __p1_162, __p2_162, __p3_162) __extension__ ({ \ 36028 float16x4_t __ret_162; \ 36029 float16x4_t __s0_162 = __p0_162; \ 36030 float16x4_t __s1_162 = __p1_162; \ 36031 float16x8_t __s2_162 = __p2_162; \ 36032 __ret_162 = vcmla_rot180_f16(__s0_162, __s1_162, 
__builtin_bit_cast(float16x4_t, (uint32x2_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_162), __p3_162), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_162), __p3_162)})); \ 36033 __ret_162; \ 36034 }) 36035 #else 36036 #define vcmla_rot180_laneq_f16(__p0_163, __p1_163, __p2_163, __p3_163) __extension__ ({ \ 36037 float16x4_t __ret_163; \ 36038 float16x4_t __s0_163 = __p0_163; \ 36039 float16x4_t __s1_163 = __p1_163; \ 36040 float16x8_t __s2_163 = __p2_163; \ 36041 float16x4_t __rev0_163; __rev0_163 = __builtin_shufflevector(__s0_163, __s0_163, 3, 2, 1, 0); \ 36042 float16x4_t __rev1_163; __rev1_163 = __builtin_shufflevector(__s1_163, __s1_163, 3, 2, 1, 0); \ 36043 float16x8_t __rev2_163; __rev2_163 = __builtin_shufflevector(__s2_163, __s2_163, 7, 6, 5, 4, 3, 2, 1, 0); \ 36044 __ret_163 = __noswap_vcmla_rot180_f16(__rev0_163, __rev1_163, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_163), __p3_163), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_163), __p3_163)})); \ 36045 __ret_163 = __builtin_shufflevector(__ret_163, __ret_163, 3, 2, 1, 0); \ 36046 __ret_163; \ 36047 }) 36048 #endif 36049 36050 #ifdef __LITTLE_ENDIAN__ 36051 #define vcmlaq_rot180_laneq_f16(__p0_164, __p1_164, __p2_164, __p3_164) __extension__ ({ \ 36052 float16x8_t __ret_164; \ 36053 float16x8_t __s0_164 = __p0_164; \ 36054 float16x8_t __s1_164 = __p1_164; \ 36055 float16x8_t __s2_164 = __p2_164; \ 36056 __ret_164 = vcmlaq_rot180_f16(__s0_164, __s1_164, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_164), __p3_164), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_164), __p3_164), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_164), __p3_164), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_164), __p3_164)})); \ 36057 __ret_164; \ 36058 }) 36059 #else 36060 #define vcmlaq_rot180_laneq_f16(__p0_165, __p1_165, __p2_165, __p3_165) __extension__ ({ \ 
36061 float16x8_t __ret_165; \ 36062 float16x8_t __s0_165 = __p0_165; \ 36063 float16x8_t __s1_165 = __p1_165; \ 36064 float16x8_t __s2_165 = __p2_165; \ 36065 float16x8_t __rev0_165; __rev0_165 = __builtin_shufflevector(__s0_165, __s0_165, 7, 6, 5, 4, 3, 2, 1, 0); \ 36066 float16x8_t __rev1_165; __rev1_165 = __builtin_shufflevector(__s1_165, __s1_165, 7, 6, 5, 4, 3, 2, 1, 0); \ 36067 float16x8_t __rev2_165; __rev2_165 = __builtin_shufflevector(__s2_165, __s2_165, 7, 6, 5, 4, 3, 2, 1, 0); \ 36068 __ret_165 = __noswap_vcmlaq_rot180_f16(__rev0_165, __rev1_165, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_165), __p3_165), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_165), __p3_165), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_165), __p3_165), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_165), __p3_165)})); \ 36069 __ret_165 = __builtin_shufflevector(__ret_165, __ret_165, 7, 6, 5, 4, 3, 2, 1, 0); \ 36070 __ret_165; \ 36071 }) 36072 #endif 36073 36074 #ifdef __LITTLE_ENDIAN__ 36075 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot270_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 36076 float16x8_t __ret; 36077 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot270_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 36078 return __ret; 36079 } 36080 #else 36081 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot270_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 36082 float16x8_t __ret; 36083 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 36084 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 36085 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 36086 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot270_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 
(int8x16_t)__rev2, 40); 36087 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 36088 return __ret; 36089 } 36090 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t __noswap_vcmlaq_rot270_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 36091 float16x8_t __ret; 36092 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot270_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 36093 return __ret; 36094 } 36095 #endif 36096 36097 #ifdef __LITTLE_ENDIAN__ 36098 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot270_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 36099 float16x4_t __ret; 36100 __ret = (float16x4_t) __builtin_neon_vcmla_rot270_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 36101 return __ret; 36102 } 36103 #else 36104 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot270_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 36105 float16x4_t __ret; 36106 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 36107 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 36108 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 36109 __ret = (float16x4_t) __builtin_neon_vcmla_rot270_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8); 36110 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 36111 return __ret; 36112 } 36113 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t __noswap_vcmla_rot270_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 36114 float16x4_t __ret; 36115 __ret = (float16x4_t) __builtin_neon_vcmla_rot270_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 36116 return __ret; 36117 } 36118 #endif 36119 36120 #ifdef __LITTLE_ENDIAN__ 36121 #define vcmla_rot270_lane_f16(__p0_166, __p1_166, __p2_166, __p3_166) __extension__ ({ \ 36122 float16x4_t __ret_166; \ 36123 float16x4_t __s0_166 = __p0_166; \ 36124 
float16x4_t __s1_166 = __p1_166; \ 36125 float16x4_t __s2_166 = __p2_166; \ 36126 __ret_166 = vcmla_rot270_f16(__s0_166, __s1_166, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_166), __p3_166), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_166), __p3_166)})); \ 36127 __ret_166; \ 36128 }) 36129 #else 36130 #define vcmla_rot270_lane_f16(__p0_167, __p1_167, __p2_167, __p3_167) __extension__ ({ \ 36131 float16x4_t __ret_167; \ 36132 float16x4_t __s0_167 = __p0_167; \ 36133 float16x4_t __s1_167 = __p1_167; \ 36134 float16x4_t __s2_167 = __p2_167; \ 36135 float16x4_t __rev0_167; __rev0_167 = __builtin_shufflevector(__s0_167, __s0_167, 3, 2, 1, 0); \ 36136 float16x4_t __rev1_167; __rev1_167 = __builtin_shufflevector(__s1_167, __s1_167, 3, 2, 1, 0); \ 36137 float16x4_t __rev2_167; __rev2_167 = __builtin_shufflevector(__s2_167, __s2_167, 3, 2, 1, 0); \ 36138 __ret_167 = __noswap_vcmla_rot270_f16(__rev0_167, __rev1_167, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_167), __p3_167), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_167), __p3_167)})); \ 36139 __ret_167 = __builtin_shufflevector(__ret_167, __ret_167, 3, 2, 1, 0); \ 36140 __ret_167; \ 36141 }) 36142 #endif 36143 36144 #ifdef __LITTLE_ENDIAN__ 36145 #define vcmlaq_rot270_lane_f16(__p0_168, __p1_168, __p2_168, __p3_168) __extension__ ({ \ 36146 float16x8_t __ret_168; \ 36147 float16x8_t __s0_168 = __p0_168; \ 36148 float16x8_t __s1_168 = __p1_168; \ 36149 float16x4_t __s2_168 = __p2_168; \ 36150 __ret_168 = vcmlaq_rot270_f16(__s0_168, __s1_168, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_168), __p3_168), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_168), __p3_168), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_168), __p3_168), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_168), __p3_168)})); \ 36151 __ret_168; \ 36152 }) 
36153 #else 36154 #define vcmlaq_rot270_lane_f16(__p0_169, __p1_169, __p2_169, __p3_169) __extension__ ({ \ 36155 float16x8_t __ret_169; \ 36156 float16x8_t __s0_169 = __p0_169; \ 36157 float16x8_t __s1_169 = __p1_169; \ 36158 float16x4_t __s2_169 = __p2_169; \ 36159 float16x8_t __rev0_169; __rev0_169 = __builtin_shufflevector(__s0_169, __s0_169, 7, 6, 5, 4, 3, 2, 1, 0); \ 36160 float16x8_t __rev1_169; __rev1_169 = __builtin_shufflevector(__s1_169, __s1_169, 7, 6, 5, 4, 3, 2, 1, 0); \ 36161 float16x4_t __rev2_169; __rev2_169 = __builtin_shufflevector(__s2_169, __s2_169, 3, 2, 1, 0); \ 36162 __ret_169 = __noswap_vcmlaq_rot270_f16(__rev0_169, __rev1_169, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_169), __p3_169), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_169), __p3_169), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_169), __p3_169), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_169), __p3_169)})); \ 36163 __ret_169 = __builtin_shufflevector(__ret_169, __ret_169, 7, 6, 5, 4, 3, 2, 1, 0); \ 36164 __ret_169; \ 36165 }) 36166 #endif 36167 36168 #ifdef __LITTLE_ENDIAN__ 36169 #define vcmla_rot270_laneq_f16(__p0_170, __p1_170, __p2_170, __p3_170) __extension__ ({ \ 36170 float16x4_t __ret_170; \ 36171 float16x4_t __s0_170 = __p0_170; \ 36172 float16x4_t __s1_170 = __p1_170; \ 36173 float16x8_t __s2_170 = __p2_170; \ 36174 __ret_170 = vcmla_rot270_f16(__s0_170, __s1_170, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_170), __p3_170), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_170), __p3_170)})); \ 36175 __ret_170; \ 36176 }) 36177 #else 36178 #define vcmla_rot270_laneq_f16(__p0_171, __p1_171, __p2_171, __p3_171) __extension__ ({ \ 36179 float16x4_t __ret_171; \ 36180 float16x4_t __s0_171 = __p0_171; \ 36181 float16x4_t __s1_171 = __p1_171; \ 36182 float16x8_t __s2_171 = __p2_171; \ 36183 float16x4_t 
__rev0_171; __rev0_171 = __builtin_shufflevector(__s0_171, __s0_171, 3, 2, 1, 0); \ 36184 float16x4_t __rev1_171; __rev1_171 = __builtin_shufflevector(__s1_171, __s1_171, 3, 2, 1, 0); \ 36185 float16x8_t __rev2_171; __rev2_171 = __builtin_shufflevector(__s2_171, __s2_171, 7, 6, 5, 4, 3, 2, 1, 0); \ 36186 __ret_171 = __noswap_vcmla_rot270_f16(__rev0_171, __rev1_171, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_171), __p3_171), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_171), __p3_171)})); \ 36187 __ret_171 = __builtin_shufflevector(__ret_171, __ret_171, 3, 2, 1, 0); \ 36188 __ret_171; \ 36189 }) 36190 #endif 36191 36192 #ifdef __LITTLE_ENDIAN__ 36193 #define vcmlaq_rot270_laneq_f16(__p0_172, __p1_172, __p2_172, __p3_172) __extension__ ({ \ 36194 float16x8_t __ret_172; \ 36195 float16x8_t __s0_172 = __p0_172; \ 36196 float16x8_t __s1_172 = __p1_172; \ 36197 float16x8_t __s2_172 = __p2_172; \ 36198 __ret_172 = vcmlaq_rot270_f16(__s0_172, __s1_172, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_172), __p3_172), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_172), __p3_172), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_172), __p3_172), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_172), __p3_172)})); \ 36199 __ret_172; \ 36200 }) 36201 #else 36202 #define vcmlaq_rot270_laneq_f16(__p0_173, __p1_173, __p2_173, __p3_173) __extension__ ({ \ 36203 float16x8_t __ret_173; \ 36204 float16x8_t __s0_173 = __p0_173; \ 36205 float16x8_t __s1_173 = __p1_173; \ 36206 float16x8_t __s2_173 = __p2_173; \ 36207 float16x8_t __rev0_173; __rev0_173 = __builtin_shufflevector(__s0_173, __s0_173, 7, 6, 5, 4, 3, 2, 1, 0); \ 36208 float16x8_t __rev1_173; __rev1_173 = __builtin_shufflevector(__s1_173, __s1_173, 7, 6, 5, 4, 3, 2, 1, 0); \ 36209 float16x8_t __rev2_173; __rev2_173 = __builtin_shufflevector(__s2_173, __s2_173, 7, 6, 5, 4, 3, 2, 1, 0); \ 
36210 __ret_173 = __noswap_vcmlaq_rot270_f16(__rev0_173, __rev1_173, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_173), __p3_173), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_173), __p3_173), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_173), __p3_173), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_173), __p3_173)})); \ 36211 __ret_173 = __builtin_shufflevector(__ret_173, __ret_173, 7, 6, 5, 4, 3, 2, 1, 0); \ 36212 __ret_173; \ 36213 }) 36214 #endif 36215 36216 #ifdef __LITTLE_ENDIAN__ 36217 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot90_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 36218 float16x8_t __ret; 36219 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot90_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 36220 return __ret; 36221 } 36222 #else 36223 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t vcmlaq_rot90_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 36224 float16x8_t __ret; 36225 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 36226 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 36227 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 36228 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot90_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 40); 36229 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 36230 return __ret; 36231 } 36232 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x8_t __noswap_vcmlaq_rot90_f16(float16x8_t __p0, float16x8_t __p1, float16x8_t __p2) { 36233 float16x8_t __ret; 36234 __ret = (float16x8_t) __builtin_neon_vcmlaq_rot90_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 40); 36235 return __ret; 36236 } 36237 #endif 36238 36239 #ifdef __LITTLE_ENDIAN__ 36240 __ai 
__attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot90_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 36241 float16x4_t __ret; 36242 __ret = (float16x4_t) __builtin_neon_vcmla_rot90_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 36243 return __ret; 36244 } 36245 #else 36246 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t vcmla_rot90_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 36247 float16x4_t __ret; 36248 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 36249 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 36250 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 36251 __ret = (float16x4_t) __builtin_neon_vcmla_rot90_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 8); 36252 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 36253 return __ret; 36254 } 36255 __ai __attribute__((target("v8.3a,fullfp16,neon"))) float16x4_t __noswap_vcmla_rot90_f16(float16x4_t __p0, float16x4_t __p1, float16x4_t __p2) { 36256 float16x4_t __ret; 36257 __ret = (float16x4_t) __builtin_neon_vcmla_rot90_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 8); 36258 return __ret; 36259 } 36260 #endif 36261 36262 #ifdef __LITTLE_ENDIAN__ 36263 #define vcmla_rot90_lane_f16(__p0_174, __p1_174, __p2_174, __p3_174) __extension__ ({ \ 36264 float16x4_t __ret_174; \ 36265 float16x4_t __s0_174 = __p0_174; \ 36266 float16x4_t __s1_174 = __p1_174; \ 36267 float16x4_t __s2_174 = __p2_174; \ 36268 __ret_174 = vcmla_rot90_f16(__s0_174, __s1_174, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_174), __p3_174), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_174), __p3_174)})); \ 36269 __ret_174; \ 36270 }) 36271 #else 36272 #define vcmla_rot90_lane_f16(__p0_175, __p1_175, __p2_175, __p3_175) __extension__ ({ \ 36273 float16x4_t __ret_175; \ 36274 float16x4_t __s0_175 = __p0_175; \ 36275 
float16x4_t __s1_175 = __p1_175; \ 36276 float16x4_t __s2_175 = __p2_175; \ 36277 float16x4_t __rev0_175; __rev0_175 = __builtin_shufflevector(__s0_175, __s0_175, 3, 2, 1, 0); \ 36278 float16x4_t __rev1_175; __rev1_175 = __builtin_shufflevector(__s1_175, __s1_175, 3, 2, 1, 0); \ 36279 float16x4_t __rev2_175; __rev2_175 = __builtin_shufflevector(__s2_175, __s2_175, 3, 2, 1, 0); \ 36280 __ret_175 = __noswap_vcmla_rot90_f16(__rev0_175, __rev1_175, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_175), __p3_175), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_175), __p3_175)})); \ 36281 __ret_175 = __builtin_shufflevector(__ret_175, __ret_175, 3, 2, 1, 0); \ 36282 __ret_175; \ 36283 }) 36284 #endif 36285 36286 #ifdef __LITTLE_ENDIAN__ 36287 #define vcmlaq_rot90_lane_f16(__p0_176, __p1_176, __p2_176, __p3_176) __extension__ ({ \ 36288 float16x8_t __ret_176; \ 36289 float16x8_t __s0_176 = __p0_176; \ 36290 float16x8_t __s1_176 = __p1_176; \ 36291 float16x4_t __s2_176 = __p2_176; \ 36292 __ret_176 = vcmlaq_rot90_f16(__s0_176, __s1_176, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_176), __p3_176), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_176), __p3_176), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_176), __p3_176), vget_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_176), __p3_176)})); \ 36293 __ret_176; \ 36294 }) 36295 #else 36296 #define vcmlaq_rot90_lane_f16(__p0_177, __p1_177, __p2_177, __p3_177) __extension__ ({ \ 36297 float16x8_t __ret_177; \ 36298 float16x8_t __s0_177 = __p0_177; \ 36299 float16x8_t __s1_177 = __p1_177; \ 36300 float16x4_t __s2_177 = __p2_177; \ 36301 float16x8_t __rev0_177; __rev0_177 = __builtin_shufflevector(__s0_177, __s0_177, 7, 6, 5, 4, 3, 2, 1, 0); \ 36302 float16x8_t __rev1_177; __rev1_177 = __builtin_shufflevector(__s1_177, __s1_177, 7, 6, 5, 4, 3, 2, 1, 0); \ 36303 float16x4_t __rev2_177; __rev2_177 = 
__builtin_shufflevector(__s2_177, __s2_177, 3, 2, 1, 0); \ 36304 __ret_177 = __noswap_vcmlaq_rot90_f16(__rev0_177, __rev1_177, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_177), __p3_177), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_177), __p3_177), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_177), __p3_177), __noswap_vget_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_177), __p3_177)})); \ 36305 __ret_177 = __builtin_shufflevector(__ret_177, __ret_177, 7, 6, 5, 4, 3, 2, 1, 0); \ 36306 __ret_177; \ 36307 }) 36308 #endif 36309 36310 #ifdef __LITTLE_ENDIAN__ 36311 #define vcmla_rot90_laneq_f16(__p0_178, __p1_178, __p2_178, __p3_178) __extension__ ({ \ 36312 float16x4_t __ret_178; \ 36313 float16x4_t __s0_178 = __p0_178; \ 36314 float16x4_t __s1_178 = __p1_178; \ 36315 float16x8_t __s2_178 = __p2_178; \ 36316 __ret_178 = vcmla_rot90_f16(__s0_178, __s1_178, __builtin_bit_cast(float16x4_t, (uint32x2_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_178), __p3_178), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_178), __p3_178)})); \ 36317 __ret_178; \ 36318 }) 36319 #else 36320 #define vcmla_rot90_laneq_f16(__p0_179, __p1_179, __p2_179, __p3_179) __extension__ ({ \ 36321 float16x4_t __ret_179; \ 36322 float16x4_t __s0_179 = __p0_179; \ 36323 float16x4_t __s1_179 = __p1_179; \ 36324 float16x8_t __s2_179 = __p2_179; \ 36325 float16x4_t __rev0_179; __rev0_179 = __builtin_shufflevector(__s0_179, __s0_179, 3, 2, 1, 0); \ 36326 float16x4_t __rev1_179; __rev1_179 = __builtin_shufflevector(__s1_179, __s1_179, 3, 2, 1, 0); \ 36327 float16x8_t __rev2_179; __rev2_179 = __builtin_shufflevector(__s2_179, __s2_179, 7, 6, 5, 4, 3, 2, 1, 0); \ 36328 __ret_179 = __noswap_vcmla_rot90_f16(__rev0_179, __rev1_179, __builtin_bit_cast(float16x4_t, (uint32x2_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_179), __p3_179), 
__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_179), __p3_179)})); \ 36329 __ret_179 = __builtin_shufflevector(__ret_179, __ret_179, 3, 2, 1, 0); \ 36330 __ret_179; \ 36331 }) 36332 #endif 36333 36334 #ifdef __LITTLE_ENDIAN__ 36335 #define vcmlaq_rot90_laneq_f16(__p0_180, __p1_180, __p2_180, __p3_180) __extension__ ({ \ 36336 float16x8_t __ret_180; \ 36337 float16x8_t __s0_180 = __p0_180; \ 36338 float16x8_t __s1_180 = __p1_180; \ 36339 float16x8_t __s2_180 = __p2_180; \ 36340 __ret_180 = vcmlaq_rot90_f16(__s0_180, __s1_180, __builtin_bit_cast(float16x8_t, (uint32x4_t) {vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_180), __p3_180), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_180), __p3_180), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_180), __p3_180), vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __s2_180), __p3_180)})); \ 36341 __ret_180; \ 36342 }) 36343 #else 36344 #define vcmlaq_rot90_laneq_f16(__p0_181, __p1_181, __p2_181, __p3_181) __extension__ ({ \ 36345 float16x8_t __ret_181; \ 36346 float16x8_t __s0_181 = __p0_181; \ 36347 float16x8_t __s1_181 = __p1_181; \ 36348 float16x8_t __s2_181 = __p2_181; \ 36349 float16x8_t __rev0_181; __rev0_181 = __builtin_shufflevector(__s0_181, __s0_181, 7, 6, 5, 4, 3, 2, 1, 0); \ 36350 float16x8_t __rev1_181; __rev1_181 = __builtin_shufflevector(__s1_181, __s1_181, 7, 6, 5, 4, 3, 2, 1, 0); \ 36351 float16x8_t __rev2_181; __rev2_181 = __builtin_shufflevector(__s2_181, __s2_181, 7, 6, 5, 4, 3, 2, 1, 0); \ 36352 __ret_181 = __noswap_vcmlaq_rot90_f16(__rev0_181, __rev1_181, __builtin_bit_cast(float16x8_t, (uint32x4_t) {__noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_181), __p3_181), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_181), __p3_181), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_181), __p3_181), __noswap_vgetq_lane_u32(__builtin_bit_cast(uint32x4_t, __rev2_181), __p3_181)})); \ 36353 __ret_181 = __builtin_shufflevector(__ret_181, __ret_181, 
7, 6, 5, 4, 3, 2, 1, 0); \ 36354 __ret_181; \ 36355 }) 36356 #endif 36357 36358 #ifdef __LITTLE_ENDIAN__ 36359 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcadd_rot270_f32(float32x2_t __p0, float32x2_t __p1) { 36360 float32x2_t __ret; 36361 __ret = (float32x2_t) __builtin_neon_vcadd_rot270_f32((int8x8_t)__p0, (int8x8_t)__p1, 9); 36362 return __ret; 36363 } 36364 #else 36365 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcadd_rot270_f32(float32x2_t __p0, float32x2_t __p1) { 36366 float32x2_t __ret; 36367 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 36368 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 36369 __ret = (float32x2_t) __builtin_neon_vcadd_rot270_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 36370 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 36371 return __ret; 36372 } 36373 #endif 36374 36375 #ifdef __LITTLE_ENDIAN__ 36376 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcadd_rot90_f32(float32x2_t __p0, float32x2_t __p1) { 36377 float32x2_t __ret; 36378 __ret = (float32x2_t) __builtin_neon_vcadd_rot90_f32((int8x8_t)__p0, (int8x8_t)__p1, 9); 36379 return __ret; 36380 } 36381 #else 36382 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcadd_rot90_f32(float32x2_t __p0, float32x2_t __p1) { 36383 float32x2_t __ret; 36384 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 36385 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 36386 __ret = (float32x2_t) __builtin_neon_vcadd_rot90_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 36387 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 36388 return __ret; 36389 } 36390 #endif 36391 36392 #ifdef __LITTLE_ENDIAN__ 36393 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcaddq_rot270_f32(float32x4_t __p0, float32x4_t __p1) { 36394 float32x4_t __ret; 36395 __ret = (float32x4_t) __builtin_neon_vcaddq_rot270_f32((int8x16_t)__p0, (int8x16_t)__p1, 41); 36396 return __ret; 36397 } 36398 
#else 36399 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcaddq_rot270_f32(float32x4_t __p0, float32x4_t __p1) { 36400 float32x4_t __ret; 36401 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 36402 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 36403 __ret = (float32x4_t) __builtin_neon_vcaddq_rot270_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 36404 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 36405 return __ret; 36406 } 36407 #endif 36408 36409 #ifdef __LITTLE_ENDIAN__ 36410 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcaddq_rot90_f32(float32x4_t __p0, float32x4_t __p1) { 36411 float32x4_t __ret; 36412 __ret = (float32x4_t) __builtin_neon_vcaddq_rot90_f32((int8x16_t)__p0, (int8x16_t)__p1, 41); 36413 return __ret; 36414 } 36415 #else 36416 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcaddq_rot90_f32(float32x4_t __p0, float32x4_t __p1) { 36417 float32x4_t __ret; 36418 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 36419 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 36420 __ret = (float32x4_t) __builtin_neon_vcaddq_rot90_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 36421 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 36422 return __ret; 36423 } 36424 #endif 36425 36426 #ifdef __LITTLE_ENDIAN__ 36427 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36428 float32x4_t __ret; 36429 __ret = (float32x4_t) __builtin_neon_vcmlaq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 36430 return __ret; 36431 } 36432 #else 36433 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36434 float32x4_t __ret; 36435 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 36436 float32x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 36437 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 36438 __ret = (float32x4_t) __builtin_neon_vcmlaq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 36439 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 36440 return __ret; 36441 } 36442 __ai __attribute__((target("v8.3a,neon"))) float32x4_t __noswap_vcmlaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36443 float32x4_t __ret; 36444 __ret = (float32x4_t) __builtin_neon_vcmlaq_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 36445 return __ret; 36446 } 36447 #endif 36448 36449 #ifdef __LITTLE_ENDIAN__ 36450 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36451 float32x2_t __ret; 36452 __ret = (float32x2_t) __builtin_neon_vcmla_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 36453 return __ret; 36454 } 36455 #else 36456 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36457 float32x2_t __ret; 36458 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 36459 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 36460 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 36461 __ret = (float32x2_t) __builtin_neon_vcmla_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 36462 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 36463 return __ret; 36464 } 36465 __ai __attribute__((target("v8.3a,neon"))) float32x2_t __noswap_vcmla_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36466 float32x2_t __ret; 36467 __ret = (float32x2_t) __builtin_neon_vcmla_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 36468 return __ret; 36469 } 36470 #endif 36471 36472 #ifdef __LITTLE_ENDIAN__ 36473 #define vcmla_lane_f32(__p0_182, __p1_182, __p2_182, __p3_182) __extension__ 
({ \ 36474 float32x2_t __ret_182; \ 36475 float32x2_t __s0_182 = __p0_182; \ 36476 float32x2_t __s1_182 = __p1_182; \ 36477 float32x2_t __s2_182 = __p2_182; \ 36478 __ret_182 = vcmla_f32(__s0_182, __s1_182, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_182), __p3_182)})); \ 36479 __ret_182; \ 36480 }) 36481 #else 36482 #define vcmla_lane_f32(__p0_183, __p1_183, __p2_183, __p3_183) __extension__ ({ \ 36483 float32x2_t __ret_183; \ 36484 float32x2_t __s0_183 = __p0_183; \ 36485 float32x2_t __s1_183 = __p1_183; \ 36486 float32x2_t __s2_183 = __p2_183; \ 36487 float32x2_t __rev0_183; __rev0_183 = __builtin_shufflevector(__s0_183, __s0_183, 1, 0); \ 36488 float32x2_t __rev1_183; __rev1_183 = __builtin_shufflevector(__s1_183, __s1_183, 1, 0); \ 36489 float32x2_t __rev2_183; __rev2_183 = __builtin_shufflevector(__s2_183, __s2_183, 1, 0); \ 36490 __ret_183 = __noswap_vcmla_f32(__rev0_183, __rev1_183, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_183), __p3_183)})); \ 36491 __ret_183 = __builtin_shufflevector(__ret_183, __ret_183, 1, 0); \ 36492 __ret_183; \ 36493 }) 36494 #endif 36495 36496 #ifdef __LITTLE_ENDIAN__ 36497 #define vcmlaq_lane_f32(__p0_184, __p1_184, __p2_184, __p3_184) __extension__ ({ \ 36498 float32x4_t __ret_184; \ 36499 float32x4_t __s0_184 = __p0_184; \ 36500 float32x4_t __s1_184 = __p1_184; \ 36501 float32x2_t __s2_184 = __p2_184; \ 36502 __ret_184 = vcmlaq_f32(__s0_184, __s1_184, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_184), __p3_184), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_184), __p3_184)})); \ 36503 __ret_184; \ 36504 }) 36505 #else 36506 #define vcmlaq_lane_f32(__p0_185, __p1_185, __p2_185, __p3_185) __extension__ ({ \ 36507 float32x4_t __ret_185; \ 36508 float32x4_t __s0_185 = __p0_185; \ 36509 float32x4_t __s1_185 = __p1_185; \ 36510 float32x2_t __s2_185 = __p2_185; \ 36511 
float32x4_t __rev0_185; __rev0_185 = __builtin_shufflevector(__s0_185, __s0_185, 3, 2, 1, 0); \ 36512 float32x4_t __rev1_185; __rev1_185 = __builtin_shufflevector(__s1_185, __s1_185, 3, 2, 1, 0); \ 36513 float32x2_t __rev2_185; __rev2_185 = __builtin_shufflevector(__s2_185, __s2_185, 1, 0); \ 36514 __ret_185 = __noswap_vcmlaq_f32(__rev0_185, __rev1_185, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_185), __p3_185), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_185), __p3_185)})); \ 36515 __ret_185 = __builtin_shufflevector(__ret_185, __ret_185, 3, 2, 1, 0); \ 36516 __ret_185; \ 36517 }) 36518 #endif 36519 36520 #ifdef __LITTLE_ENDIAN__ 36521 #define vcmla_laneq_f32(__p0_186, __p1_186, __p2_186, __p3_186) __extension__ ({ \ 36522 float32x2_t __ret_186; \ 36523 float32x2_t __s0_186 = __p0_186; \ 36524 float32x2_t __s1_186 = __p1_186; \ 36525 float32x4_t __s2_186 = __p2_186; \ 36526 __ret_186 = vcmla_f32(__s0_186, __s1_186, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_186), __p3_186)})); \ 36527 __ret_186; \ 36528 }) 36529 #else 36530 #define vcmla_laneq_f32(__p0_187, __p1_187, __p2_187, __p3_187) __extension__ ({ \ 36531 float32x2_t __ret_187; \ 36532 float32x2_t __s0_187 = __p0_187; \ 36533 float32x2_t __s1_187 = __p1_187; \ 36534 float32x4_t __s2_187 = __p2_187; \ 36535 float32x2_t __rev0_187; __rev0_187 = __builtin_shufflevector(__s0_187, __s0_187, 1, 0); \ 36536 float32x2_t __rev1_187; __rev1_187 = __builtin_shufflevector(__s1_187, __s1_187, 1, 0); \ 36537 float32x4_t __rev2_187; __rev2_187 = __builtin_shufflevector(__s2_187, __s2_187, 3, 2, 1, 0); \ 36538 __ret_187 = __noswap_vcmla_f32(__rev0_187, __rev1_187, __builtin_bit_cast(float32x2_t, (uint64x1_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_187), __p3_187)})); \ 36539 __ret_187 = __builtin_shufflevector(__ret_187, __ret_187, 1, 0); \ 36540 __ret_187; \ 36541 }) 36542 #endif 36543 
36544 #ifdef __LITTLE_ENDIAN__ 36545 #define vcmlaq_laneq_f32(__p0_188, __p1_188, __p2_188, __p3_188) __extension__ ({ \ 36546 float32x4_t __ret_188; \ 36547 float32x4_t __s0_188 = __p0_188; \ 36548 float32x4_t __s1_188 = __p1_188; \ 36549 float32x4_t __s2_188 = __p2_188; \ 36550 __ret_188 = vcmlaq_f32(__s0_188, __s1_188, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_188), __p3_188), vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_188), __p3_188)})); \ 36551 __ret_188; \ 36552 }) 36553 #else 36554 #define vcmlaq_laneq_f32(__p0_189, __p1_189, __p2_189, __p3_189) __extension__ ({ \ 36555 float32x4_t __ret_189; \ 36556 float32x4_t __s0_189 = __p0_189; \ 36557 float32x4_t __s1_189 = __p1_189; \ 36558 float32x4_t __s2_189 = __p2_189; \ 36559 float32x4_t __rev0_189; __rev0_189 = __builtin_shufflevector(__s0_189, __s0_189, 3, 2, 1, 0); \ 36560 float32x4_t __rev1_189; __rev1_189 = __builtin_shufflevector(__s1_189, __s1_189, 3, 2, 1, 0); \ 36561 float32x4_t __rev2_189; __rev2_189 = __builtin_shufflevector(__s2_189, __s2_189, 3, 2, 1, 0); \ 36562 __ret_189 = __noswap_vcmlaq_f32(__rev0_189, __rev1_189, __builtin_bit_cast(float32x4_t, (uint64x2_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_189), __p3_189), __noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_189), __p3_189)})); \ 36563 __ret_189 = __builtin_shufflevector(__ret_189, __ret_189, 3, 2, 1, 0); \ 36564 __ret_189; \ 36565 }) 36566 #endif 36567 36568 #ifdef __LITTLE_ENDIAN__ 36569 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot180_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36570 float32x4_t __ret; 36571 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot180_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 36572 return __ret; 36573 } 36574 #else 36575 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot180_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36576 float32x4_t 
__ret; 36577 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 36578 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 36579 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 36580 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot180_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 36581 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 36582 return __ret; 36583 } 36584 __ai __attribute__((target("v8.3a,neon"))) float32x4_t __noswap_vcmlaq_rot180_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36585 float32x4_t __ret; 36586 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot180_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 36587 return __ret; 36588 } 36589 #endif 36590 36591 #ifdef __LITTLE_ENDIAN__ 36592 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot180_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36593 float32x2_t __ret; 36594 __ret = (float32x2_t) __builtin_neon_vcmla_rot180_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 36595 return __ret; 36596 } 36597 #else 36598 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot180_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36599 float32x2_t __ret; 36600 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 36601 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 36602 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 36603 __ret = (float32x2_t) __builtin_neon_vcmla_rot180_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 36604 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 36605 return __ret; 36606 } 36607 __ai __attribute__((target("v8.3a,neon"))) float32x2_t __noswap_vcmla_rot180_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36608 float32x2_t __ret; 36609 __ret = (float32x2_t) __builtin_neon_vcmla_rot180_f32((int8x8_t)__p0, 
(int8x8_t)__p1, (int8x8_t)__p2, 9); 36610 return __ret; 36611 } 36612 #endif 36613 36614 #ifdef __LITTLE_ENDIAN__ 36615 #define vcmla_rot180_lane_f32(__p0_190, __p1_190, __p2_190, __p3_190) __extension__ ({ \ 36616 float32x2_t __ret_190; \ 36617 float32x2_t __s0_190 = __p0_190; \ 36618 float32x2_t __s1_190 = __p1_190; \ 36619 float32x2_t __s2_190 = __p2_190; \ 36620 __ret_190 = vcmla_rot180_f32(__s0_190, __s1_190, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_190), __p3_190)})); \ 36621 __ret_190; \ 36622 }) 36623 #else 36624 #define vcmla_rot180_lane_f32(__p0_191, __p1_191, __p2_191, __p3_191) __extension__ ({ \ 36625 float32x2_t __ret_191; \ 36626 float32x2_t __s0_191 = __p0_191; \ 36627 float32x2_t __s1_191 = __p1_191; \ 36628 float32x2_t __s2_191 = __p2_191; \ 36629 float32x2_t __rev0_191; __rev0_191 = __builtin_shufflevector(__s0_191, __s0_191, 1, 0); \ 36630 float32x2_t __rev1_191; __rev1_191 = __builtin_shufflevector(__s1_191, __s1_191, 1, 0); \ 36631 float32x2_t __rev2_191; __rev2_191 = __builtin_shufflevector(__s2_191, __s2_191, 1, 0); \ 36632 __ret_191 = __noswap_vcmla_rot180_f32(__rev0_191, __rev1_191, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_191), __p3_191)})); \ 36633 __ret_191 = __builtin_shufflevector(__ret_191, __ret_191, 1, 0); \ 36634 __ret_191; \ 36635 }) 36636 #endif 36637 36638 #ifdef __LITTLE_ENDIAN__ 36639 #define vcmlaq_rot180_lane_f32(__p0_192, __p1_192, __p2_192, __p3_192) __extension__ ({ \ 36640 float32x4_t __ret_192; \ 36641 float32x4_t __s0_192 = __p0_192; \ 36642 float32x4_t __s1_192 = __p1_192; \ 36643 float32x2_t __s2_192 = __p2_192; \ 36644 __ret_192 = vcmlaq_rot180_f32(__s0_192, __s1_192, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_192), __p3_192), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_192), __p3_192)})); \ 36645 __ret_192; \ 36646 }) 36647 #else 36648 #define 
vcmlaq_rot180_lane_f32(__p0_193, __p1_193, __p2_193, __p3_193) __extension__ ({ \ 36649 float32x4_t __ret_193; \ 36650 float32x4_t __s0_193 = __p0_193; \ 36651 float32x4_t __s1_193 = __p1_193; \ 36652 float32x2_t __s2_193 = __p2_193; \ 36653 float32x4_t __rev0_193; __rev0_193 = __builtin_shufflevector(__s0_193, __s0_193, 3, 2, 1, 0); \ 36654 float32x4_t __rev1_193; __rev1_193 = __builtin_shufflevector(__s1_193, __s1_193, 3, 2, 1, 0); \ 36655 float32x2_t __rev2_193; __rev2_193 = __builtin_shufflevector(__s2_193, __s2_193, 1, 0); \ 36656 __ret_193 = __noswap_vcmlaq_rot180_f32(__rev0_193, __rev1_193, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_193), __p3_193), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_193), __p3_193)})); \ 36657 __ret_193 = __builtin_shufflevector(__ret_193, __ret_193, 3, 2, 1, 0); \ 36658 __ret_193; \ 36659 }) 36660 #endif 36661 36662 #ifdef __LITTLE_ENDIAN__ 36663 #define vcmla_rot180_laneq_f32(__p0_194, __p1_194, __p2_194, __p3_194) __extension__ ({ \ 36664 float32x2_t __ret_194; \ 36665 float32x2_t __s0_194 = __p0_194; \ 36666 float32x2_t __s1_194 = __p1_194; \ 36667 float32x4_t __s2_194 = __p2_194; \ 36668 __ret_194 = vcmla_rot180_f32(__s0_194, __s1_194, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_194), __p3_194)})); \ 36669 __ret_194; \ 36670 }) 36671 #else 36672 #define vcmla_rot180_laneq_f32(__p0_195, __p1_195, __p2_195, __p3_195) __extension__ ({ \ 36673 float32x2_t __ret_195; \ 36674 float32x2_t __s0_195 = __p0_195; \ 36675 float32x2_t __s1_195 = __p1_195; \ 36676 float32x4_t __s2_195 = __p2_195; \ 36677 float32x2_t __rev0_195; __rev0_195 = __builtin_shufflevector(__s0_195, __s0_195, 1, 0); \ 36678 float32x2_t __rev1_195; __rev1_195 = __builtin_shufflevector(__s1_195, __s1_195, 1, 0); \ 36679 float32x4_t __rev2_195; __rev2_195 = __builtin_shufflevector(__s2_195, __s2_195, 3, 2, 1, 0); \ 36680 __ret_195 = 
__noswap_vcmla_rot180_f32(__rev0_195, __rev1_195, __builtin_bit_cast(float32x2_t, (uint64x1_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_195), __p3_195)})); \ 36681 __ret_195 = __builtin_shufflevector(__ret_195, __ret_195, 1, 0); \ 36682 __ret_195; \ 36683 }) 36684 #endif 36685 36686 #ifdef __LITTLE_ENDIAN__ 36687 #define vcmlaq_rot180_laneq_f32(__p0_196, __p1_196, __p2_196, __p3_196) __extension__ ({ \ 36688 float32x4_t __ret_196; \ 36689 float32x4_t __s0_196 = __p0_196; \ 36690 float32x4_t __s1_196 = __p1_196; \ 36691 float32x4_t __s2_196 = __p2_196; \ 36692 __ret_196 = vcmlaq_rot180_f32(__s0_196, __s1_196, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_196), __p3_196), vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_196), __p3_196)})); \ 36693 __ret_196; \ 36694 }) 36695 #else 36696 #define vcmlaq_rot180_laneq_f32(__p0_197, __p1_197, __p2_197, __p3_197) __extension__ ({ \ 36697 float32x4_t __ret_197; \ 36698 float32x4_t __s0_197 = __p0_197; \ 36699 float32x4_t __s1_197 = __p1_197; \ 36700 float32x4_t __s2_197 = __p2_197; \ 36701 float32x4_t __rev0_197; __rev0_197 = __builtin_shufflevector(__s0_197, __s0_197, 3, 2, 1, 0); \ 36702 float32x4_t __rev1_197; __rev1_197 = __builtin_shufflevector(__s1_197, __s1_197, 3, 2, 1, 0); \ 36703 float32x4_t __rev2_197; __rev2_197 = __builtin_shufflevector(__s2_197, __s2_197, 3, 2, 1, 0); \ 36704 __ret_197 = __noswap_vcmlaq_rot180_f32(__rev0_197, __rev1_197, __builtin_bit_cast(float32x4_t, (uint64x2_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_197), __p3_197), __noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_197), __p3_197)})); \ 36705 __ret_197 = __builtin_shufflevector(__ret_197, __ret_197, 3, 2, 1, 0); \ 36706 __ret_197; \ 36707 }) 36708 #endif 36709 36710 #ifdef __LITTLE_ENDIAN__ 36711 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot270_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36712 
float32x4_t __ret; 36713 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot270_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 36714 return __ret; 36715 } 36716 #else 36717 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot270_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36718 float32x4_t __ret; 36719 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 36720 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 36721 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 36722 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot270_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 36723 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 36724 return __ret; 36725 } 36726 __ai __attribute__((target("v8.3a,neon"))) float32x4_t __noswap_vcmlaq_rot270_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36727 float32x4_t __ret; 36728 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot270_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 36729 return __ret; 36730 } 36731 #endif 36732 36733 #ifdef __LITTLE_ENDIAN__ 36734 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot270_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36735 float32x2_t __ret; 36736 __ret = (float32x2_t) __builtin_neon_vcmla_rot270_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 36737 return __ret; 36738 } 36739 #else 36740 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot270_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36741 float32x2_t __ret; 36742 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 36743 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 36744 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 36745 __ret = (float32x2_t) __builtin_neon_vcmla_rot270_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 36746 
__ret = __builtin_shufflevector(__ret, __ret, 1, 0); 36747 return __ret; 36748 } 36749 __ai __attribute__((target("v8.3a,neon"))) float32x2_t __noswap_vcmla_rot270_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36750 float32x2_t __ret; 36751 __ret = (float32x2_t) __builtin_neon_vcmla_rot270_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 36752 return __ret; 36753 } 36754 #endif 36755 36756 #ifdef __LITTLE_ENDIAN__ 36757 #define vcmla_rot270_lane_f32(__p0_198, __p1_198, __p2_198, __p3_198) __extension__ ({ \ 36758 float32x2_t __ret_198; \ 36759 float32x2_t __s0_198 = __p0_198; \ 36760 float32x2_t __s1_198 = __p1_198; \ 36761 float32x2_t __s2_198 = __p2_198; \ 36762 __ret_198 = vcmla_rot270_f32(__s0_198, __s1_198, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_198), __p3_198)})); \ 36763 __ret_198; \ 36764 }) 36765 #else 36766 #define vcmla_rot270_lane_f32(__p0_199, __p1_199, __p2_199, __p3_199) __extension__ ({ \ 36767 float32x2_t __ret_199; \ 36768 float32x2_t __s0_199 = __p0_199; \ 36769 float32x2_t __s1_199 = __p1_199; \ 36770 float32x2_t __s2_199 = __p2_199; \ 36771 float32x2_t __rev0_199; __rev0_199 = __builtin_shufflevector(__s0_199, __s0_199, 1, 0); \ 36772 float32x2_t __rev1_199; __rev1_199 = __builtin_shufflevector(__s1_199, __s1_199, 1, 0); \ 36773 float32x2_t __rev2_199; __rev2_199 = __builtin_shufflevector(__s2_199, __s2_199, 1, 0); \ 36774 __ret_199 = __noswap_vcmla_rot270_f32(__rev0_199, __rev1_199, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_199), __p3_199)})); \ 36775 __ret_199 = __builtin_shufflevector(__ret_199, __ret_199, 1, 0); \ 36776 __ret_199; \ 36777 }) 36778 #endif 36779 36780 #ifdef __LITTLE_ENDIAN__ 36781 #define vcmlaq_rot270_lane_f32(__p0_200, __p1_200, __p2_200, __p3_200) __extension__ ({ \ 36782 float32x4_t __ret_200; \ 36783 float32x4_t __s0_200 = __p0_200; \ 36784 float32x4_t __s1_200 = __p1_200; \ 36785 
float32x2_t __s2_200 = __p2_200; \ 36786 __ret_200 = vcmlaq_rot270_f32(__s0_200, __s1_200, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_200), __p3_200), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_200), __p3_200)})); \ 36787 __ret_200; \ 36788 }) 36789 #else 36790 #define vcmlaq_rot270_lane_f32(__p0_201, __p1_201, __p2_201, __p3_201) __extension__ ({ \ 36791 float32x4_t __ret_201; \ 36792 float32x4_t __s0_201 = __p0_201; \ 36793 float32x4_t __s1_201 = __p1_201; \ 36794 float32x2_t __s2_201 = __p2_201; \ 36795 float32x4_t __rev0_201; __rev0_201 = __builtin_shufflevector(__s0_201, __s0_201, 3, 2, 1, 0); \ 36796 float32x4_t __rev1_201; __rev1_201 = __builtin_shufflevector(__s1_201, __s1_201, 3, 2, 1, 0); \ 36797 float32x2_t __rev2_201; __rev2_201 = __builtin_shufflevector(__s2_201, __s2_201, 1, 0); \ 36798 __ret_201 = __noswap_vcmlaq_rot270_f32(__rev0_201, __rev1_201, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_201), __p3_201), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_201), __p3_201)})); \ 36799 __ret_201 = __builtin_shufflevector(__ret_201, __ret_201, 3, 2, 1, 0); \ 36800 __ret_201; \ 36801 }) 36802 #endif 36803 36804 #ifdef __LITTLE_ENDIAN__ 36805 #define vcmla_rot270_laneq_f32(__p0_202, __p1_202, __p2_202, __p3_202) __extension__ ({ \ 36806 float32x2_t __ret_202; \ 36807 float32x2_t __s0_202 = __p0_202; \ 36808 float32x2_t __s1_202 = __p1_202; \ 36809 float32x4_t __s2_202 = __p2_202; \ 36810 __ret_202 = vcmla_rot270_f32(__s0_202, __s1_202, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_202), __p3_202)})); \ 36811 __ret_202; \ 36812 }) 36813 #else 36814 #define vcmla_rot270_laneq_f32(__p0_203, __p1_203, __p2_203, __p3_203) __extension__ ({ \ 36815 float32x2_t __ret_203; \ 36816 float32x2_t __s0_203 = __p0_203; \ 36817 float32x2_t __s1_203 = __p1_203; \ 36818 float32x4_t __s2_203 = __p2_203; \ 
36819 float32x2_t __rev0_203; __rev0_203 = __builtin_shufflevector(__s0_203, __s0_203, 1, 0); \ 36820 float32x2_t __rev1_203; __rev1_203 = __builtin_shufflevector(__s1_203, __s1_203, 1, 0); \ 36821 float32x4_t __rev2_203; __rev2_203 = __builtin_shufflevector(__s2_203, __s2_203, 3, 2, 1, 0); \ 36822 __ret_203 = __noswap_vcmla_rot270_f32(__rev0_203, __rev1_203, __builtin_bit_cast(float32x2_t, (uint64x1_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_203), __p3_203)})); \ 36823 __ret_203 = __builtin_shufflevector(__ret_203, __ret_203, 1, 0); \ 36824 __ret_203; \ 36825 }) 36826 #endif 36827 36828 #ifdef __LITTLE_ENDIAN__ 36829 #define vcmlaq_rot270_laneq_f32(__p0_204, __p1_204, __p2_204, __p3_204) __extension__ ({ \ 36830 float32x4_t __ret_204; \ 36831 float32x4_t __s0_204 = __p0_204; \ 36832 float32x4_t __s1_204 = __p1_204; \ 36833 float32x4_t __s2_204 = __p2_204; \ 36834 __ret_204 = vcmlaq_rot270_f32(__s0_204, __s1_204, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_204), __p3_204), vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_204), __p3_204)})); \ 36835 __ret_204; \ 36836 }) 36837 #else 36838 #define vcmlaq_rot270_laneq_f32(__p0_205, __p1_205, __p2_205, __p3_205) __extension__ ({ \ 36839 float32x4_t __ret_205; \ 36840 float32x4_t __s0_205 = __p0_205; \ 36841 float32x4_t __s1_205 = __p1_205; \ 36842 float32x4_t __s2_205 = __p2_205; \ 36843 float32x4_t __rev0_205; __rev0_205 = __builtin_shufflevector(__s0_205, __s0_205, 3, 2, 1, 0); \ 36844 float32x4_t __rev1_205; __rev1_205 = __builtin_shufflevector(__s1_205, __s1_205, 3, 2, 1, 0); \ 36845 float32x4_t __rev2_205; __rev2_205 = __builtin_shufflevector(__s2_205, __s2_205, 3, 2, 1, 0); \ 36846 __ret_205 = __noswap_vcmlaq_rot270_f32(__rev0_205, __rev1_205, __builtin_bit_cast(float32x4_t, (uint64x2_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_205), __p3_205), __noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_205), 
__p3_205)})); \ 36847 __ret_205 = __builtin_shufflevector(__ret_205, __ret_205, 3, 2, 1, 0); \ 36848 __ret_205; \ 36849 }) 36850 #endif 36851 36852 #ifdef __LITTLE_ENDIAN__ 36853 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot90_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36854 float32x4_t __ret; 36855 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot90_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 36856 return __ret; 36857 } 36858 #else 36859 __ai __attribute__((target("v8.3a,neon"))) float32x4_t vcmlaq_rot90_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36860 float32x4_t __ret; 36861 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 36862 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 36863 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 36864 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot90_f32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 36865 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 36866 return __ret; 36867 } 36868 __ai __attribute__((target("v8.3a,neon"))) float32x4_t __noswap_vcmlaq_rot90_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 36869 float32x4_t __ret; 36870 __ret = (float32x4_t) __builtin_neon_vcmlaq_rot90_f32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 36871 return __ret; 36872 } 36873 #endif 36874 36875 #ifdef __LITTLE_ENDIAN__ 36876 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot90_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36877 float32x2_t __ret; 36878 __ret = (float32x2_t) __builtin_neon_vcmla_rot90_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 36879 return __ret; 36880 } 36881 #else 36882 __ai __attribute__((target("v8.3a,neon"))) float32x2_t vcmla_rot90_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36883 float32x2_t __ret; 36884 float32x2_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 1, 0); 36885 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 36886 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 36887 __ret = (float32x2_t) __builtin_neon_vcmla_rot90_f32((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 36888 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 36889 return __ret; 36890 } 36891 __ai __attribute__((target("v8.3a,neon"))) float32x2_t __noswap_vcmla_rot90_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 36892 float32x2_t __ret; 36893 __ret = (float32x2_t) __builtin_neon_vcmla_rot90_f32((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 36894 return __ret; 36895 } 36896 #endif 36897 36898 #ifdef __LITTLE_ENDIAN__ 36899 #define vcmla_rot90_lane_f32(__p0_206, __p1_206, __p2_206, __p3_206) __extension__ ({ \ 36900 float32x2_t __ret_206; \ 36901 float32x2_t __s0_206 = __p0_206; \ 36902 float32x2_t __s1_206 = __p1_206; \ 36903 float32x2_t __s2_206 = __p2_206; \ 36904 __ret_206 = vcmla_rot90_f32(__s0_206, __s1_206, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_206), __p3_206)})); \ 36905 __ret_206; \ 36906 }) 36907 #else 36908 #define vcmla_rot90_lane_f32(__p0_207, __p1_207, __p2_207, __p3_207) __extension__ ({ \ 36909 float32x2_t __ret_207; \ 36910 float32x2_t __s0_207 = __p0_207; \ 36911 float32x2_t __s1_207 = __p1_207; \ 36912 float32x2_t __s2_207 = __p2_207; \ 36913 float32x2_t __rev0_207; __rev0_207 = __builtin_shufflevector(__s0_207, __s0_207, 1, 0); \ 36914 float32x2_t __rev1_207; __rev1_207 = __builtin_shufflevector(__s1_207, __s1_207, 1, 0); \ 36915 float32x2_t __rev2_207; __rev2_207 = __builtin_shufflevector(__s2_207, __s2_207, 1, 0); \ 36916 __ret_207 = __noswap_vcmla_rot90_f32(__rev0_207, __rev1_207, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_207), __p3_207)})); \ 36917 __ret_207 = __builtin_shufflevector(__ret_207, 
__ret_207, 1, 0); \ 36918 __ret_207; \ 36919 }) 36920 #endif 36921 36922 #ifdef __LITTLE_ENDIAN__ 36923 #define vcmlaq_rot90_lane_f32(__p0_208, __p1_208, __p2_208, __p3_208) __extension__ ({ \ 36924 float32x4_t __ret_208; \ 36925 float32x4_t __s0_208 = __p0_208; \ 36926 float32x4_t __s1_208 = __p1_208; \ 36927 float32x2_t __s2_208 = __p2_208; \ 36928 __ret_208 = vcmlaq_rot90_f32(__s0_208, __s1_208, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_208), __p3_208), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __s2_208), __p3_208)})); \ 36929 __ret_208; \ 36930 }) 36931 #else 36932 #define vcmlaq_rot90_lane_f32(__p0_209, __p1_209, __p2_209, __p3_209) __extension__ ({ \ 36933 float32x4_t __ret_209; \ 36934 float32x4_t __s0_209 = __p0_209; \ 36935 float32x4_t __s1_209 = __p1_209; \ 36936 float32x2_t __s2_209 = __p2_209; \ 36937 float32x4_t __rev0_209; __rev0_209 = __builtin_shufflevector(__s0_209, __s0_209, 3, 2, 1, 0); \ 36938 float32x4_t __rev1_209; __rev1_209 = __builtin_shufflevector(__s1_209, __s1_209, 3, 2, 1, 0); \ 36939 float32x2_t __rev2_209; __rev2_209 = __builtin_shufflevector(__s2_209, __s2_209, 1, 0); \ 36940 __ret_209 = __noswap_vcmlaq_rot90_f32(__rev0_209, __rev1_209, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_209), __p3_209), vget_lane_u64(__builtin_bit_cast(uint64x1_t, __rev2_209), __p3_209)})); \ 36941 __ret_209 = __builtin_shufflevector(__ret_209, __ret_209, 3, 2, 1, 0); \ 36942 __ret_209; \ 36943 }) 36944 #endif 36945 36946 #ifdef __LITTLE_ENDIAN__ 36947 #define vcmla_rot90_laneq_f32(__p0_210, __p1_210, __p2_210, __p3_210) __extension__ ({ \ 36948 float32x2_t __ret_210; \ 36949 float32x2_t __s0_210 = __p0_210; \ 36950 float32x2_t __s1_210 = __p1_210; \ 36951 float32x4_t __s2_210 = __p2_210; \ 36952 __ret_210 = vcmla_rot90_f32(__s0_210, __s1_210, __builtin_bit_cast(float32x2_t, (uint64x1_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_210), 
__p3_210)})); \ 36953 __ret_210; \ 36954 }) 36955 #else 36956 #define vcmla_rot90_laneq_f32(__p0_211, __p1_211, __p2_211, __p3_211) __extension__ ({ \ 36957 float32x2_t __ret_211; \ 36958 float32x2_t __s0_211 = __p0_211; \ 36959 float32x2_t __s1_211 = __p1_211; \ 36960 float32x4_t __s2_211 = __p2_211; \ 36961 float32x2_t __rev0_211; __rev0_211 = __builtin_shufflevector(__s0_211, __s0_211, 1, 0); \ 36962 float32x2_t __rev1_211; __rev1_211 = __builtin_shufflevector(__s1_211, __s1_211, 1, 0); \ 36963 float32x4_t __rev2_211; __rev2_211 = __builtin_shufflevector(__s2_211, __s2_211, 3, 2, 1, 0); \ 36964 __ret_211 = __noswap_vcmla_rot90_f32(__rev0_211, __rev1_211, __builtin_bit_cast(float32x2_t, (uint64x1_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_211), __p3_211)})); \ 36965 __ret_211 = __builtin_shufflevector(__ret_211, __ret_211, 1, 0); \ 36966 __ret_211; \ 36967 }) 36968 #endif 36969 36970 #ifdef __LITTLE_ENDIAN__ 36971 #define vcmlaq_rot90_laneq_f32(__p0_212, __p1_212, __p2_212, __p3_212) __extension__ ({ \ 36972 float32x4_t __ret_212; \ 36973 float32x4_t __s0_212 = __p0_212; \ 36974 float32x4_t __s1_212 = __p1_212; \ 36975 float32x4_t __s2_212 = __p2_212; \ 36976 __ret_212 = vcmlaq_rot90_f32(__s0_212, __s1_212, __builtin_bit_cast(float32x4_t, (uint64x2_t) {vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_212), __p3_212), vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __s2_212), __p3_212)})); \ 36977 __ret_212; \ 36978 }) 36979 #else 36980 #define vcmlaq_rot90_laneq_f32(__p0_213, __p1_213, __p2_213, __p3_213) __extension__ ({ \ 36981 float32x4_t __ret_213; \ 36982 float32x4_t __s0_213 = __p0_213; \ 36983 float32x4_t __s1_213 = __p1_213; \ 36984 float32x4_t __s2_213 = __p2_213; \ 36985 float32x4_t __rev0_213; __rev0_213 = __builtin_shufflevector(__s0_213, __s0_213, 3, 2, 1, 0); \ 36986 float32x4_t __rev1_213; __rev1_213 = __builtin_shufflevector(__s1_213, __s1_213, 3, 2, 1, 0); \ 36987 float32x4_t __rev2_213; __rev2_213 = 
__builtin_shufflevector(__s2_213, __s2_213, 3, 2, 1, 0); \ 36988 __ret_213 = __noswap_vcmlaq_rot90_f32(__rev0_213, __rev1_213, __builtin_bit_cast(float32x4_t, (uint64x2_t) {__noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_213), __p3_213), __noswap_vgetq_lane_u64(__builtin_bit_cast(uint64x2_t, __rev2_213), __p3_213)})); \ 36989 __ret_213 = __builtin_shufflevector(__ret_213, __ret_213, 3, 2, 1, 0); \ 36990 __ret_213; \ 36991 }) 36992 #endif 36993 36994 #if !defined(__aarch64__) && !defined(__arm64ec__) 36995 #ifdef __LITTLE_ENDIAN__ 36996 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __a32_vcvt_bf16_f32(float32x4_t __p0) { 36997 bfloat16x4_t __ret; 36998 __ret = (bfloat16x4_t) __builtin_neon___a32_vcvt_bf16_f32((int8x16_t)__p0, 11); 36999 return __ret; 37000 } 37001 #else 37002 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __a32_vcvt_bf16_f32(float32x4_t __p0) { 37003 bfloat16x4_t __ret; 37004 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 37005 __ret = (bfloat16x4_t) __builtin_neon___a32_vcvt_bf16_f32((int8x16_t)__rev0, 11); 37006 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 37007 return __ret; 37008 } 37009 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t __noswap___a32_vcvt_bf16_f32(float32x4_t __p0) { 37010 bfloat16x4_t __ret; 37011 __ret = (bfloat16x4_t) __builtin_neon___a32_vcvt_bf16_f32((int8x16_t)__p0, 11); 37012 return __ret; 37013 } 37014 #endif 37015 37016 #ifdef __LITTLE_ENDIAN__ 37017 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vcvt_bf16_f32(float32x4_t __p0) { 37018 bfloat16x4_t __ret; 37019 __ret = __a32_vcvt_bf16_f32(__p0); 37020 return __ret; 37021 } 37022 #else 37023 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vcvt_bf16_f32(float32x4_t __p0) { 37024 bfloat16x4_t __ret; 37025 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 37026 __ret = __noswap___a32_vcvt_bf16_f32(__rev0); 37027 __ret = __builtin_shufflevector(__ret, 
__ret, 3, 2, 1, 0); 37028 return __ret; 37029 } 37030 #endif 37031 37032 #ifdef __LITTLE_ENDIAN__ 37033 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_high_bf16_f32(bfloat16x8_t __p0, float32x4_t __p1) { 37034 bfloat16x8_t __ret; 37035 __ret = vcombine_bf16(__a32_vcvt_bf16_f32(__p1), vget_low_bf16(__p0)); 37036 return __ret; 37037 } 37038 #else 37039 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_high_bf16_f32(bfloat16x8_t __p0, float32x4_t __p1) { 37040 bfloat16x8_t __ret; 37041 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 37042 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 37043 __ret = __noswap_vcombine_bf16(__noswap___a32_vcvt_bf16_f32(__rev1), __noswap_vget_low_bf16(__rev0)); 37044 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 37045 return __ret; 37046 } 37047 #endif 37048 37049 #ifdef __LITTLE_ENDIAN__ 37050 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_low_bf16_f32(float32x4_t __p0) { 37051 bfloat16x8_t __ret; 37052 __ret = vcombine_bf16((bfloat16x4_t)(0ULL), __a32_vcvt_bf16_f32(__p0)); 37053 return __ret; 37054 } 37055 #else 37056 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_low_bf16_f32(float32x4_t __p0) { 37057 bfloat16x8_t __ret; 37058 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 37059 __ret = __noswap_vcombine_bf16((bfloat16x4_t)(0ULL), __noswap___a32_vcvt_bf16_f32(__rev0)); 37060 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 37061 return __ret; 37062 } 37063 #endif 37064 37065 __ai __attribute__((target("bf16,neon"))) poly8x8_t vreinterpret_p8_bf16(bfloat16x4_t __p0) { 37066 poly8x8_t __ret; 37067 __ret = (poly8x8_t)(__p0); 37068 return __ret; 37069 } 37070 __ai __attribute__((target("bf16,neon"))) poly64x1_t vreinterpret_p64_bf16(bfloat16x4_t __p0) { 37071 poly64x1_t __ret; 37072 __ret = (poly64x1_t)(__p0); 37073 return __ret; 37074 } 
37075 __ai __attribute__((target("bf16,neon"))) poly16x4_t vreinterpret_p16_bf16(bfloat16x4_t __p0) { 37076 poly16x4_t __ret; 37077 __ret = (poly16x4_t)(__p0); 37078 return __ret; 37079 } 37080 __ai __attribute__((target("bf16,neon"))) poly8x16_t vreinterpretq_p8_bf16(bfloat16x8_t __p0) { 37081 poly8x16_t __ret; 37082 __ret = (poly8x16_t)(__p0); 37083 return __ret; 37084 } 37085 __ai __attribute__((target("bf16,neon"))) poly64x2_t vreinterpretq_p64_bf16(bfloat16x8_t __p0) { 37086 poly64x2_t __ret; 37087 __ret = (poly64x2_t)(__p0); 37088 return __ret; 37089 } 37090 __ai __attribute__((target("bf16,neon"))) poly16x8_t vreinterpretq_p16_bf16(bfloat16x8_t __p0) { 37091 poly16x8_t __ret; 37092 __ret = (poly16x8_t)(__p0); 37093 return __ret; 37094 } 37095 __ai __attribute__((target("bf16,neon"))) uint8x16_t vreinterpretq_u8_bf16(bfloat16x8_t __p0) { 37096 uint8x16_t __ret; 37097 __ret = (uint8x16_t)(__p0); 37098 return __ret; 37099 } 37100 __ai __attribute__((target("bf16,neon"))) uint32x4_t vreinterpretq_u32_bf16(bfloat16x8_t __p0) { 37101 uint32x4_t __ret; 37102 __ret = (uint32x4_t)(__p0); 37103 return __ret; 37104 } 37105 __ai __attribute__((target("bf16,neon"))) uint64x2_t vreinterpretq_u64_bf16(bfloat16x8_t __p0) { 37106 uint64x2_t __ret; 37107 __ret = (uint64x2_t)(__p0); 37108 return __ret; 37109 } 37110 __ai __attribute__((target("bf16,neon"))) uint16x8_t vreinterpretq_u16_bf16(bfloat16x8_t __p0) { 37111 uint16x8_t __ret; 37112 __ret = (uint16x8_t)(__p0); 37113 return __ret; 37114 } 37115 __ai __attribute__((target("bf16,neon"))) int8x16_t vreinterpretq_s8_bf16(bfloat16x8_t __p0) { 37116 int8x16_t __ret; 37117 __ret = (int8x16_t)(__p0); 37118 return __ret; 37119 } 37120 __ai __attribute__((target("bf16,neon"))) float32x4_t vreinterpretq_f32_bf16(bfloat16x8_t __p0) { 37121 float32x4_t __ret; 37122 __ret = (float32x4_t)(__p0); 37123 return __ret; 37124 } 37125 __ai __attribute__((target("bf16,neon"))) float16x8_t vreinterpretq_f16_bf16(bfloat16x8_t __p0) { 37126 
float16x8_t __ret; 37127 __ret = (float16x8_t)(__p0); 37128 return __ret; 37129 } 37130 __ai __attribute__((target("bf16,neon"))) int32x4_t vreinterpretq_s32_bf16(bfloat16x8_t __p0) { 37131 int32x4_t __ret; 37132 __ret = (int32x4_t)(__p0); 37133 return __ret; 37134 } 37135 __ai __attribute__((target("bf16,neon"))) int64x2_t vreinterpretq_s64_bf16(bfloat16x8_t __p0) { 37136 int64x2_t __ret; 37137 __ret = (int64x2_t)(__p0); 37138 return __ret; 37139 } 37140 __ai __attribute__((target("bf16,neon"))) int16x8_t vreinterpretq_s16_bf16(bfloat16x8_t __p0) { 37141 int16x8_t __ret; 37142 __ret = (int16x8_t)(__p0); 37143 return __ret; 37144 } 37145 __ai __attribute__((target("bf16,neon"))) uint8x8_t vreinterpret_u8_bf16(bfloat16x4_t __p0) { 37146 uint8x8_t __ret; 37147 __ret = (uint8x8_t)(__p0); 37148 return __ret; 37149 } 37150 __ai __attribute__((target("bf16,neon"))) uint32x2_t vreinterpret_u32_bf16(bfloat16x4_t __p0) { 37151 uint32x2_t __ret; 37152 __ret = (uint32x2_t)(__p0); 37153 return __ret; 37154 } 37155 __ai __attribute__((target("bf16,neon"))) uint64x1_t vreinterpret_u64_bf16(bfloat16x4_t __p0) { 37156 uint64x1_t __ret; 37157 __ret = (uint64x1_t)(__p0); 37158 return __ret; 37159 } 37160 __ai __attribute__((target("bf16,neon"))) uint16x4_t vreinterpret_u16_bf16(bfloat16x4_t __p0) { 37161 uint16x4_t __ret; 37162 __ret = (uint16x4_t)(__p0); 37163 return __ret; 37164 } 37165 __ai __attribute__((target("bf16,neon"))) int8x8_t vreinterpret_s8_bf16(bfloat16x4_t __p0) { 37166 int8x8_t __ret; 37167 __ret = (int8x8_t)(__p0); 37168 return __ret; 37169 } 37170 __ai __attribute__((target("bf16,neon"))) float32x2_t vreinterpret_f32_bf16(bfloat16x4_t __p0) { 37171 float32x2_t __ret; 37172 __ret = (float32x2_t)(__p0); 37173 return __ret; 37174 } 37175 __ai __attribute__((target("bf16,neon"))) float16x4_t vreinterpret_f16_bf16(bfloat16x4_t __p0) { 37176 float16x4_t __ret; 37177 __ret = (float16x4_t)(__p0); 37178 return __ret; 37179 } 37180 __ai __attribute__((target("bf16,neon"))) 
int32x2_t vreinterpret_s32_bf16(bfloat16x4_t __p0) { 37181 int32x2_t __ret; 37182 __ret = (int32x2_t)(__p0); 37183 return __ret; 37184 } 37185 __ai __attribute__((target("bf16,neon"))) int64x1_t vreinterpret_s64_bf16(bfloat16x4_t __p0) { 37186 int64x1_t __ret; 37187 __ret = (int64x1_t)(__p0); 37188 return __ret; 37189 } 37190 __ai __attribute__((target("bf16,neon"))) int16x4_t vreinterpret_s16_bf16(bfloat16x4_t __p0) { 37191 int16x4_t __ret; 37192 __ret = (int16x4_t)(__p0); 37193 return __ret; 37194 } 37195 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p8(poly8x16_t __p0) { 37196 bfloat16x8_t __ret; 37197 __ret = (bfloat16x8_t)(__p0); 37198 return __ret; 37199 } 37200 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p64(poly64x2_t __p0) { 37201 bfloat16x8_t __ret; 37202 __ret = (bfloat16x8_t)(__p0); 37203 return __ret; 37204 } 37205 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p16(poly16x8_t __p0) { 37206 bfloat16x8_t __ret; 37207 __ret = (bfloat16x8_t)(__p0); 37208 return __ret; 37209 } 37210 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u8(uint8x16_t __p0) { 37211 bfloat16x8_t __ret; 37212 __ret = (bfloat16x8_t)(__p0); 37213 return __ret; 37214 } 37215 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u32(uint32x4_t __p0) { 37216 bfloat16x8_t __ret; 37217 __ret = (bfloat16x8_t)(__p0); 37218 return __ret; 37219 } 37220 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u64(uint64x2_t __p0) { 37221 bfloat16x8_t __ret; 37222 __ret = (bfloat16x8_t)(__p0); 37223 return __ret; 37224 } 37225 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u16(uint16x8_t __p0) { 37226 bfloat16x8_t __ret; 37227 __ret = (bfloat16x8_t)(__p0); 37228 return __ret; 37229 } 37230 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s8(int8x16_t __p0) { 37231 bfloat16x8_t __ret; 37232 __ret = 
(bfloat16x8_t)(__p0); 37233 return __ret; 37234 } 37235 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f32(float32x4_t __p0) { 37236 bfloat16x8_t __ret; 37237 __ret = (bfloat16x8_t)(__p0); 37238 return __ret; 37239 } 37240 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f16(float16x8_t __p0) { 37241 bfloat16x8_t __ret; 37242 __ret = (bfloat16x8_t)(__p0); 37243 return __ret; 37244 } 37245 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s32(int32x4_t __p0) { 37246 bfloat16x8_t __ret; 37247 __ret = (bfloat16x8_t)(__p0); 37248 return __ret; 37249 } 37250 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s64(int64x2_t __p0) { 37251 bfloat16x8_t __ret; 37252 __ret = (bfloat16x8_t)(__p0); 37253 return __ret; 37254 } 37255 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s16(int16x8_t __p0) { 37256 bfloat16x8_t __ret; 37257 __ret = (bfloat16x8_t)(__p0); 37258 return __ret; 37259 } 37260 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p8(poly8x8_t __p0) { 37261 bfloat16x4_t __ret; 37262 __ret = (bfloat16x4_t)(__p0); 37263 return __ret; 37264 } 37265 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p64(poly64x1_t __p0) { 37266 bfloat16x4_t __ret; 37267 __ret = (bfloat16x4_t)(__p0); 37268 return __ret; 37269 } 37270 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p16(poly16x4_t __p0) { 37271 bfloat16x4_t __ret; 37272 __ret = (bfloat16x4_t)(__p0); 37273 return __ret; 37274 } 37275 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u8(uint8x8_t __p0) { 37276 bfloat16x4_t __ret; 37277 __ret = (bfloat16x4_t)(__p0); 37278 return __ret; 37279 } 37280 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u32(uint32x2_t __p0) { 37281 bfloat16x4_t __ret; 37282 __ret = (bfloat16x4_t)(__p0); 37283 return __ret; 37284 } 37285 __ai 
__attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u64(uint64x1_t __p0) { 37286 bfloat16x4_t __ret; 37287 __ret = (bfloat16x4_t)(__p0); 37288 return __ret; 37289 } 37290 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u16(uint16x4_t __p0) { 37291 bfloat16x4_t __ret; 37292 __ret = (bfloat16x4_t)(__p0); 37293 return __ret; 37294 } 37295 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s8(int8x8_t __p0) { 37296 bfloat16x4_t __ret; 37297 __ret = (bfloat16x4_t)(__p0); 37298 return __ret; 37299 } 37300 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f32(float32x2_t __p0) { 37301 bfloat16x4_t __ret; 37302 __ret = (bfloat16x4_t)(__p0); 37303 return __ret; 37304 } 37305 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f16(float16x4_t __p0) { 37306 bfloat16x4_t __ret; 37307 __ret = (bfloat16x4_t)(__p0); 37308 return __ret; 37309 } 37310 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s32(int32x2_t __p0) { 37311 bfloat16x4_t __ret; 37312 __ret = (bfloat16x4_t)(__p0); 37313 return __ret; 37314 } 37315 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s64(int64x1_t __p0) { 37316 bfloat16x4_t __ret; 37317 __ret = (bfloat16x4_t)(__p0); 37318 return __ret; 37319 } 37320 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s16(int16x4_t __p0) { 37321 bfloat16x4_t __ret; 37322 __ret = (bfloat16x4_t)(__p0); 37323 return __ret; 37324 } 37325 #ifdef __LITTLE_ENDIAN__ 37326 #define vqdmulhq_lane_s32(__p0_214, __p1_214, __p2_214) __extension__ ({ \ 37327 int32x4_t __ret_214; \ 37328 int32x4_t __s0_214 = __p0_214; \ 37329 int32x2_t __s1_214 = __p1_214; \ 37330 __ret_214 = vqdmulhq_s32(__s0_214, splatq_lane_s32(__s1_214, __p2_214)); \ 37331 __ret_214; \ 37332 }) 37333 #else 37334 #define vqdmulhq_lane_s32(__p0_215, __p1_215, __p2_215) __extension__ ({ \ 37335 int32x4_t __ret_215; \ 37336 int32x4_t __s0_215 = 
__p0_215; \ 37337 int32x2_t __s1_215 = __p1_215; \ 37338 int32x4_t __rev0_215; __rev0_215 = __builtin_shufflevector(__s0_215, __s0_215, 3, 2, 1, 0); \ 37339 int32x2_t __rev1_215; __rev1_215 = __builtin_shufflevector(__s1_215, __s1_215, 1, 0); \ 37340 __ret_215 = __noswap_vqdmulhq_s32(__rev0_215, __noswap_splatq_lane_s32(__rev1_215, __p2_215)); \ 37341 __ret_215 = __builtin_shufflevector(__ret_215, __ret_215, 3, 2, 1, 0); \ 37342 __ret_215; \ 37343 }) 37344 #endif 37345 37346 #ifdef __LITTLE_ENDIAN__ 37347 #define vqdmulhq_lane_s16(__p0_216, __p1_216, __p2_216) __extension__ ({ \ 37348 int16x8_t __ret_216; \ 37349 int16x8_t __s0_216 = __p0_216; \ 37350 int16x4_t __s1_216 = __p1_216; \ 37351 __ret_216 = vqdmulhq_s16(__s0_216, splatq_lane_s16(__s1_216, __p2_216)); \ 37352 __ret_216; \ 37353 }) 37354 #else 37355 #define vqdmulhq_lane_s16(__p0_217, __p1_217, __p2_217) __extension__ ({ \ 37356 int16x8_t __ret_217; \ 37357 int16x8_t __s0_217 = __p0_217; \ 37358 int16x4_t __s1_217 = __p1_217; \ 37359 int16x8_t __rev0_217; __rev0_217 = __builtin_shufflevector(__s0_217, __s0_217, 7, 6, 5, 4, 3, 2, 1, 0); \ 37360 int16x4_t __rev1_217; __rev1_217 = __builtin_shufflevector(__s1_217, __s1_217, 3, 2, 1, 0); \ 37361 __ret_217 = __noswap_vqdmulhq_s16(__rev0_217, __noswap_splatq_lane_s16(__rev1_217, __p2_217)); \ 37362 __ret_217 = __builtin_shufflevector(__ret_217, __ret_217, 7, 6, 5, 4, 3, 2, 1, 0); \ 37363 __ret_217; \ 37364 }) 37365 #endif 37366 37367 #ifdef __LITTLE_ENDIAN__ 37368 #define vqdmulh_lane_s32(__p0_218, __p1_218, __p2_218) __extension__ ({ \ 37369 int32x2_t __ret_218; \ 37370 int32x2_t __s0_218 = __p0_218; \ 37371 int32x2_t __s1_218 = __p1_218; \ 37372 __ret_218 = vqdmulh_s32(__s0_218, splat_lane_s32(__s1_218, __p2_218)); \ 37373 __ret_218; \ 37374 }) 37375 #else 37376 #define vqdmulh_lane_s32(__p0_219, __p1_219, __p2_219) __extension__ ({ \ 37377 int32x2_t __ret_219; \ 37378 int32x2_t __s0_219 = __p0_219; \ 37379 int32x2_t __s1_219 = __p1_219; \ 37380 int32x2_t 
__rev0_219; __rev0_219 = __builtin_shufflevector(__s0_219, __s0_219, 1, 0); \ 37381 int32x2_t __rev1_219; __rev1_219 = __builtin_shufflevector(__s1_219, __s1_219, 1, 0); \ 37382 __ret_219 = __noswap_vqdmulh_s32(__rev0_219, __noswap_splat_lane_s32(__rev1_219, __p2_219)); \ 37383 __ret_219 = __builtin_shufflevector(__ret_219, __ret_219, 1, 0); \ 37384 __ret_219; \ 37385 }) 37386 #endif 37387 37388 #ifdef __LITTLE_ENDIAN__ 37389 #define vqdmulh_lane_s16(__p0_220, __p1_220, __p2_220) __extension__ ({ \ 37390 int16x4_t __ret_220; \ 37391 int16x4_t __s0_220 = __p0_220; \ 37392 int16x4_t __s1_220 = __p1_220; \ 37393 __ret_220 = vqdmulh_s16(__s0_220, splat_lane_s16(__s1_220, __p2_220)); \ 37394 __ret_220; \ 37395 }) 37396 #else 37397 #define vqdmulh_lane_s16(__p0_221, __p1_221, __p2_221) __extension__ ({ \ 37398 int16x4_t __ret_221; \ 37399 int16x4_t __s0_221 = __p0_221; \ 37400 int16x4_t __s1_221 = __p1_221; \ 37401 int16x4_t __rev0_221; __rev0_221 = __builtin_shufflevector(__s0_221, __s0_221, 3, 2, 1, 0); \ 37402 int16x4_t __rev1_221; __rev1_221 = __builtin_shufflevector(__s1_221, __s1_221, 3, 2, 1, 0); \ 37403 __ret_221 = __noswap_vqdmulh_s16(__rev0_221, __noswap_splat_lane_s16(__rev1_221, __p2_221)); \ 37404 __ret_221 = __builtin_shufflevector(__ret_221, __ret_221, 3, 2, 1, 0); \ 37405 __ret_221; \ 37406 }) 37407 #endif 37408 37409 #ifdef __LITTLE_ENDIAN__ 37410 #define vqrdmulhq_lane_s32(__p0_222, __p1_222, __p2_222) __extension__ ({ \ 37411 int32x4_t __ret_222; \ 37412 int32x4_t __s0_222 = __p0_222; \ 37413 int32x2_t __s1_222 = __p1_222; \ 37414 __ret_222 = vqrdmulhq_s32(__s0_222, splatq_lane_s32(__s1_222, __p2_222)); \ 37415 __ret_222; \ 37416 }) 37417 #else 37418 #define vqrdmulhq_lane_s32(__p0_223, __p1_223, __p2_223) __extension__ ({ \ 37419 int32x4_t __ret_223; \ 37420 int32x4_t __s0_223 = __p0_223; \ 37421 int32x2_t __s1_223 = __p1_223; \ 37422 int32x4_t __rev0_223; __rev0_223 = __builtin_shufflevector(__s0_223, __s0_223, 3, 2, 1, 0); \ 37423 int32x2_t 
__rev1_223; __rev1_223 = __builtin_shufflevector(__s1_223, __s1_223, 1, 0); \ 37424 __ret_223 = __noswap_vqrdmulhq_s32(__rev0_223, __noswap_splatq_lane_s32(__rev1_223, __p2_223)); \ 37425 __ret_223 = __builtin_shufflevector(__ret_223, __ret_223, 3, 2, 1, 0); \ 37426 __ret_223; \ 37427 }) 37428 #endif 37429 37430 #ifdef __LITTLE_ENDIAN__ 37431 #define vqrdmulhq_lane_s16(__p0_224, __p1_224, __p2_224) __extension__ ({ \ 37432 int16x8_t __ret_224; \ 37433 int16x8_t __s0_224 = __p0_224; \ 37434 int16x4_t __s1_224 = __p1_224; \ 37435 __ret_224 = vqrdmulhq_s16(__s0_224, splatq_lane_s16(__s1_224, __p2_224)); \ 37436 __ret_224; \ 37437 }) 37438 #else 37439 #define vqrdmulhq_lane_s16(__p0_225, __p1_225, __p2_225) __extension__ ({ \ 37440 int16x8_t __ret_225; \ 37441 int16x8_t __s0_225 = __p0_225; \ 37442 int16x4_t __s1_225 = __p1_225; \ 37443 int16x8_t __rev0_225; __rev0_225 = __builtin_shufflevector(__s0_225, __s0_225, 7, 6, 5, 4, 3, 2, 1, 0); \ 37444 int16x4_t __rev1_225; __rev1_225 = __builtin_shufflevector(__s1_225, __s1_225, 3, 2, 1, 0); \ 37445 __ret_225 = __noswap_vqrdmulhq_s16(__rev0_225, __noswap_splatq_lane_s16(__rev1_225, __p2_225)); \ 37446 __ret_225 = __builtin_shufflevector(__ret_225, __ret_225, 7, 6, 5, 4, 3, 2, 1, 0); \ 37447 __ret_225; \ 37448 }) 37449 #endif 37450 37451 #ifdef __LITTLE_ENDIAN__ 37452 #define vqrdmulh_lane_s32(__p0_226, __p1_226, __p2_226) __extension__ ({ \ 37453 int32x2_t __ret_226; \ 37454 int32x2_t __s0_226 = __p0_226; \ 37455 int32x2_t __s1_226 = __p1_226; \ 37456 __ret_226 = vqrdmulh_s32(__s0_226, splat_lane_s32(__s1_226, __p2_226)); \ 37457 __ret_226; \ 37458 }) 37459 #else 37460 #define vqrdmulh_lane_s32(__p0_227, __p1_227, __p2_227) __extension__ ({ \ 37461 int32x2_t __ret_227; \ 37462 int32x2_t __s0_227 = __p0_227; \ 37463 int32x2_t __s1_227 = __p1_227; \ 37464 int32x2_t __rev0_227; __rev0_227 = __builtin_shufflevector(__s0_227, __s0_227, 1, 0); \ 37465 int32x2_t __rev1_227; __rev1_227 = __builtin_shufflevector(__s1_227, __s1_227, 
1, 0); \ 37466 __ret_227 = __noswap_vqrdmulh_s32(__rev0_227, __noswap_splat_lane_s32(__rev1_227, __p2_227)); \ 37467 __ret_227 = __builtin_shufflevector(__ret_227, __ret_227, 1, 0); \ 37468 __ret_227; \ 37469 }) 37470 #endif 37471 37472 #ifdef __LITTLE_ENDIAN__ 37473 #define vqrdmulh_lane_s16(__p0_228, __p1_228, __p2_228) __extension__ ({ \ 37474 int16x4_t __ret_228; \ 37475 int16x4_t __s0_228 = __p0_228; \ 37476 int16x4_t __s1_228 = __p1_228; \ 37477 __ret_228 = vqrdmulh_s16(__s0_228, splat_lane_s16(__s1_228, __p2_228)); \ 37478 __ret_228; \ 37479 }) 37480 #else 37481 #define vqrdmulh_lane_s16(__p0_229, __p1_229, __p2_229) __extension__ ({ \ 37482 int16x4_t __ret_229; \ 37483 int16x4_t __s0_229 = __p0_229; \ 37484 int16x4_t __s1_229 = __p1_229; \ 37485 int16x4_t __rev0_229; __rev0_229 = __builtin_shufflevector(__s0_229, __s0_229, 3, 2, 1, 0); \ 37486 int16x4_t __rev1_229; __rev1_229 = __builtin_shufflevector(__s1_229, __s1_229, 3, 2, 1, 0); \ 37487 __ret_229 = __noswap_vqrdmulh_s16(__rev0_229, __noswap_splat_lane_s16(__rev1_229, __p2_229)); \ 37488 __ret_229 = __builtin_shufflevector(__ret_229, __ret_229, 3, 2, 1, 0); \ 37489 __ret_229; \ 37490 }) 37491 #endif 37492 37493 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_p16(poly16x4_t __p0) { 37494 poly8x8_t __ret; 37495 __ret = (poly8x8_t)(__p0); 37496 return __ret; 37497 } 37498 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u8(uint8x8_t __p0) { 37499 poly8x8_t __ret; 37500 __ret = (poly8x8_t)(__p0); 37501 return __ret; 37502 } 37503 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u32(uint32x2_t __p0) { 37504 poly8x8_t __ret; 37505 __ret = (poly8x8_t)(__p0); 37506 return __ret; 37507 } 37508 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u64(uint64x1_t __p0) { 37509 poly8x8_t __ret; 37510 __ret = (poly8x8_t)(__p0); 37511 return __ret; 37512 } 37513 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u16(uint16x4_t __p0) { 37514 poly8x8_t 
__ret; 37515 __ret = (poly8x8_t)(__p0); 37516 return __ret; 37517 } 37518 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s8(int8x8_t __p0) { 37519 poly8x8_t __ret; 37520 __ret = (poly8x8_t)(__p0); 37521 return __ret; 37522 } 37523 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f32(float32x2_t __p0) { 37524 poly8x8_t __ret; 37525 __ret = (poly8x8_t)(__p0); 37526 return __ret; 37527 } 37528 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f16(float16x4_t __p0) { 37529 poly8x8_t __ret; 37530 __ret = (poly8x8_t)(__p0); 37531 return __ret; 37532 } 37533 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s32(int32x2_t __p0) { 37534 poly8x8_t __ret; 37535 __ret = (poly8x8_t)(__p0); 37536 return __ret; 37537 } 37538 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s64(int64x1_t __p0) { 37539 poly8x8_t __ret; 37540 __ret = (poly8x8_t)(__p0); 37541 return __ret; 37542 } 37543 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s16(int16x4_t __p0) { 37544 poly8x8_t __ret; 37545 __ret = (poly8x8_t)(__p0); 37546 return __ret; 37547 } 37548 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_p8(poly8x8_t __p0) { 37549 poly16x4_t __ret; 37550 __ret = (poly16x4_t)(__p0); 37551 return __ret; 37552 } 37553 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u8(uint8x8_t __p0) { 37554 poly16x4_t __ret; 37555 __ret = (poly16x4_t)(__p0); 37556 return __ret; 37557 } 37558 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u32(uint32x2_t __p0) { 37559 poly16x4_t __ret; 37560 __ret = (poly16x4_t)(__p0); 37561 return __ret; 37562 } 37563 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u64(uint64x1_t __p0) { 37564 poly16x4_t __ret; 37565 __ret = (poly16x4_t)(__p0); 37566 return __ret; 37567 } 37568 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u16(uint16x4_t __p0) { 37569 poly16x4_t __ret; 37570 __ret = (poly16x4_t)(__p0); 37571 
return __ret; 37572 } 37573 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s8(int8x8_t __p0) { 37574 poly16x4_t __ret; 37575 __ret = (poly16x4_t)(__p0); 37576 return __ret; 37577 } 37578 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f32(float32x2_t __p0) { 37579 poly16x4_t __ret; 37580 __ret = (poly16x4_t)(__p0); 37581 return __ret; 37582 } 37583 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f16(float16x4_t __p0) { 37584 poly16x4_t __ret; 37585 __ret = (poly16x4_t)(__p0); 37586 return __ret; 37587 } 37588 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s32(int32x2_t __p0) { 37589 poly16x4_t __ret; 37590 __ret = (poly16x4_t)(__p0); 37591 return __ret; 37592 } 37593 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s64(int64x1_t __p0) { 37594 poly16x4_t __ret; 37595 __ret = (poly16x4_t)(__p0); 37596 return __ret; 37597 } 37598 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s16(int16x4_t __p0) { 37599 poly16x4_t __ret; 37600 __ret = (poly16x4_t)(__p0); 37601 return __ret; 37602 } 37603 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_p16(poly16x8_t __p0) { 37604 poly8x16_t __ret; 37605 __ret = (poly8x16_t)(__p0); 37606 return __ret; 37607 } 37608 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u8(uint8x16_t __p0) { 37609 poly8x16_t __ret; 37610 __ret = (poly8x16_t)(__p0); 37611 return __ret; 37612 } 37613 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u32(uint32x4_t __p0) { 37614 poly8x16_t __ret; 37615 __ret = (poly8x16_t)(__p0); 37616 return __ret; 37617 } 37618 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u64(uint64x2_t __p0) { 37619 poly8x16_t __ret; 37620 __ret = (poly8x16_t)(__p0); 37621 return __ret; 37622 } 37623 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u16(uint16x8_t __p0) { 37624 poly8x16_t __ret; 37625 __ret = (poly8x16_t)(__p0); 37626 return __ret; 37627 } 
37628 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s8(int8x16_t __p0) { 37629 poly8x16_t __ret; 37630 __ret = (poly8x16_t)(__p0); 37631 return __ret; 37632 } 37633 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f32(float32x4_t __p0) { 37634 poly8x16_t __ret; 37635 __ret = (poly8x16_t)(__p0); 37636 return __ret; 37637 } 37638 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f16(float16x8_t __p0) { 37639 poly8x16_t __ret; 37640 __ret = (poly8x16_t)(__p0); 37641 return __ret; 37642 } 37643 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s32(int32x4_t __p0) { 37644 poly8x16_t __ret; 37645 __ret = (poly8x16_t)(__p0); 37646 return __ret; 37647 } 37648 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s64(int64x2_t __p0) { 37649 poly8x16_t __ret; 37650 __ret = (poly8x16_t)(__p0); 37651 return __ret; 37652 } 37653 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s16(int16x8_t __p0) { 37654 poly8x16_t __ret; 37655 __ret = (poly8x16_t)(__p0); 37656 return __ret; 37657 } 37658 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_p8(poly8x16_t __p0) { 37659 poly16x8_t __ret; 37660 __ret = (poly16x8_t)(__p0); 37661 return __ret; 37662 } 37663 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u8(uint8x16_t __p0) { 37664 poly16x8_t __ret; 37665 __ret = (poly16x8_t)(__p0); 37666 return __ret; 37667 } 37668 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u32(uint32x4_t __p0) { 37669 poly16x8_t __ret; 37670 __ret = (poly16x8_t)(__p0); 37671 return __ret; 37672 } 37673 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u64(uint64x2_t __p0) { 37674 poly16x8_t __ret; 37675 __ret = (poly16x8_t)(__p0); 37676 return __ret; 37677 } 37678 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u16(uint16x8_t __p0) { 37679 poly16x8_t __ret; 37680 __ret = (poly16x8_t)(__p0); 37681 return __ret; 37682 } 37683 __ai 
__attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s8(int8x16_t __p0) { 37684 poly16x8_t __ret; 37685 __ret = (poly16x8_t)(__p0); 37686 return __ret; 37687 } 37688 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f32(float32x4_t __p0) { 37689 poly16x8_t __ret; 37690 __ret = (poly16x8_t)(__p0); 37691 return __ret; 37692 } 37693 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f16(float16x8_t __p0) { 37694 poly16x8_t __ret; 37695 __ret = (poly16x8_t)(__p0); 37696 return __ret; 37697 } 37698 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s32(int32x4_t __p0) { 37699 poly16x8_t __ret; 37700 __ret = (poly16x8_t)(__p0); 37701 return __ret; 37702 } 37703 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s64(int64x2_t __p0) { 37704 poly16x8_t __ret; 37705 __ret = (poly16x8_t)(__p0); 37706 return __ret; 37707 } 37708 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s16(int16x8_t __p0) { 37709 poly16x8_t __ret; 37710 __ret = (poly16x8_t)(__p0); 37711 return __ret; 37712 } 37713 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p8(poly8x16_t __p0) { 37714 uint8x16_t __ret; 37715 __ret = (uint8x16_t)(__p0); 37716 return __ret; 37717 } 37718 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p16(poly16x8_t __p0) { 37719 uint8x16_t __ret; 37720 __ret = (uint8x16_t)(__p0); 37721 return __ret; 37722 } 37723 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u32(uint32x4_t __p0) { 37724 uint8x16_t __ret; 37725 __ret = (uint8x16_t)(__p0); 37726 return __ret; 37727 } 37728 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u64(uint64x2_t __p0) { 37729 uint8x16_t __ret; 37730 __ret = (uint8x16_t)(__p0); 37731 return __ret; 37732 } 37733 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u16(uint16x8_t __p0) { 37734 uint8x16_t __ret; 37735 __ret = (uint8x16_t)(__p0); 37736 return __ret; 37737 } 37738 __ai 
__attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s8(int8x16_t __p0) { 37739 uint8x16_t __ret; 37740 __ret = (uint8x16_t)(__p0); 37741 return __ret; 37742 } 37743 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f32(float32x4_t __p0) { 37744 uint8x16_t __ret; 37745 __ret = (uint8x16_t)(__p0); 37746 return __ret; 37747 } 37748 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f16(float16x8_t __p0) { 37749 uint8x16_t __ret; 37750 __ret = (uint8x16_t)(__p0); 37751 return __ret; 37752 } 37753 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s32(int32x4_t __p0) { 37754 uint8x16_t __ret; 37755 __ret = (uint8x16_t)(__p0); 37756 return __ret; 37757 } 37758 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s64(int64x2_t __p0) { 37759 uint8x16_t __ret; 37760 __ret = (uint8x16_t)(__p0); 37761 return __ret; 37762 } 37763 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s16(int16x8_t __p0) { 37764 uint8x16_t __ret; 37765 __ret = (uint8x16_t)(__p0); 37766 return __ret; 37767 } 37768 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p8(poly8x16_t __p0) { 37769 uint32x4_t __ret; 37770 __ret = (uint32x4_t)(__p0); 37771 return __ret; 37772 } 37773 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p16(poly16x8_t __p0) { 37774 uint32x4_t __ret; 37775 __ret = (uint32x4_t)(__p0); 37776 return __ret; 37777 } 37778 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u8(uint8x16_t __p0) { 37779 uint32x4_t __ret; 37780 __ret = (uint32x4_t)(__p0); 37781 return __ret; 37782 } 37783 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u64(uint64x2_t __p0) { 37784 uint32x4_t __ret; 37785 __ret = (uint32x4_t)(__p0); 37786 return __ret; 37787 } 37788 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u16(uint16x8_t __p0) { 37789 uint32x4_t __ret; 37790 __ret = (uint32x4_t)(__p0); 37791 return __ret; 37792 } 37793 __ai 
__attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s8(int8x16_t __p0) { 37794 uint32x4_t __ret; 37795 __ret = (uint32x4_t)(__p0); 37796 return __ret; 37797 } 37798 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f32(float32x4_t __p0) { 37799 uint32x4_t __ret; 37800 __ret = (uint32x4_t)(__p0); 37801 return __ret; 37802 } 37803 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f16(float16x8_t __p0) { 37804 uint32x4_t __ret; 37805 __ret = (uint32x4_t)(__p0); 37806 return __ret; 37807 } 37808 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s32(int32x4_t __p0) { 37809 uint32x4_t __ret; 37810 __ret = (uint32x4_t)(__p0); 37811 return __ret; 37812 } 37813 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s64(int64x2_t __p0) { 37814 uint32x4_t __ret; 37815 __ret = (uint32x4_t)(__p0); 37816 return __ret; 37817 } 37818 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s16(int16x8_t __p0) { 37819 uint32x4_t __ret; 37820 __ret = (uint32x4_t)(__p0); 37821 return __ret; 37822 } 37823 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p8(poly8x16_t __p0) { 37824 uint64x2_t __ret; 37825 __ret = (uint64x2_t)(__p0); 37826 return __ret; 37827 } 37828 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p16(poly16x8_t __p0) { 37829 uint64x2_t __ret; 37830 __ret = (uint64x2_t)(__p0); 37831 return __ret; 37832 } 37833 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u8(uint8x16_t __p0) { 37834 uint64x2_t __ret; 37835 __ret = (uint64x2_t)(__p0); 37836 return __ret; 37837 } 37838 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u32(uint32x4_t __p0) { 37839 uint64x2_t __ret; 37840 __ret = (uint64x2_t)(__p0); 37841 return __ret; 37842 } 37843 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u16(uint16x8_t __p0) { 37844 uint64x2_t __ret; 37845 __ret = (uint64x2_t)(__p0); 37846 return __ret; 37847 } 37848 __ai 
__attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s8(int8x16_t __p0) { 37849 uint64x2_t __ret; 37850 __ret = (uint64x2_t)(__p0); 37851 return __ret; 37852 } 37853 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f32(float32x4_t __p0) { 37854 uint64x2_t __ret; 37855 __ret = (uint64x2_t)(__p0); 37856 return __ret; 37857 } 37858 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f16(float16x8_t __p0) { 37859 uint64x2_t __ret; 37860 __ret = (uint64x2_t)(__p0); 37861 return __ret; 37862 } 37863 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s32(int32x4_t __p0) { 37864 uint64x2_t __ret; 37865 __ret = (uint64x2_t)(__p0); 37866 return __ret; 37867 } 37868 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s64(int64x2_t __p0) { 37869 uint64x2_t __ret; 37870 __ret = (uint64x2_t)(__p0); 37871 return __ret; 37872 } 37873 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s16(int16x8_t __p0) { 37874 uint64x2_t __ret; 37875 __ret = (uint64x2_t)(__p0); 37876 return __ret; 37877 } 37878 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p8(poly8x16_t __p0) { 37879 uint16x8_t __ret; 37880 __ret = (uint16x8_t)(__p0); 37881 return __ret; 37882 } 37883 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p16(poly16x8_t __p0) { 37884 uint16x8_t __ret; 37885 __ret = (uint16x8_t)(__p0); 37886 return __ret; 37887 } 37888 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u8(uint8x16_t __p0) { 37889 uint16x8_t __ret; 37890 __ret = (uint16x8_t)(__p0); 37891 return __ret; 37892 } 37893 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u32(uint32x4_t __p0) { 37894 uint16x8_t __ret; 37895 __ret = (uint16x8_t)(__p0); 37896 return __ret; 37897 } 37898 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u64(uint64x2_t __p0) { 37899 uint16x8_t __ret; 37900 __ret = (uint16x8_t)(__p0); 37901 return __ret; 37902 } 37903 __ai 
__attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s8(int8x16_t __p0) { 37904 uint16x8_t __ret; 37905 __ret = (uint16x8_t)(__p0); 37906 return __ret; 37907 } 37908 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f32(float32x4_t __p0) { 37909 uint16x8_t __ret; 37910 __ret = (uint16x8_t)(__p0); 37911 return __ret; 37912 } 37913 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f16(float16x8_t __p0) { 37914 uint16x8_t __ret; 37915 __ret = (uint16x8_t)(__p0); 37916 return __ret; 37917 } 37918 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s32(int32x4_t __p0) { 37919 uint16x8_t __ret; 37920 __ret = (uint16x8_t)(__p0); 37921 return __ret; 37922 } 37923 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s64(int64x2_t __p0) { 37924 uint16x8_t __ret; 37925 __ret = (uint16x8_t)(__p0); 37926 return __ret; 37927 } 37928 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s16(int16x8_t __p0) { 37929 uint16x8_t __ret; 37930 __ret = (uint16x8_t)(__p0); 37931 return __ret; 37932 } 37933 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p8(poly8x16_t __p0) { 37934 int8x16_t __ret; 37935 __ret = (int8x16_t)(__p0); 37936 return __ret; 37937 } 37938 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p16(poly16x8_t __p0) { 37939 int8x16_t __ret; 37940 __ret = (int8x16_t)(__p0); 37941 return __ret; 37942 } 37943 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u8(uint8x16_t __p0) { 37944 int8x16_t __ret; 37945 __ret = (int8x16_t)(__p0); 37946 return __ret; 37947 } 37948 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u32(uint32x4_t __p0) { 37949 int8x16_t __ret; 37950 __ret = (int8x16_t)(__p0); 37951 return __ret; 37952 } 37953 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u64(uint64x2_t __p0) { 37954 int8x16_t __ret; 37955 __ret = (int8x16_t)(__p0); 37956 return __ret; 37957 } 37958 __ai __attribute__((target("neon"))) 
int8x16_t vreinterpretq_s8_u16(uint16x8_t __p0) { 37959 int8x16_t __ret; 37960 __ret = (int8x16_t)(__p0); 37961 return __ret; 37962 } 37963 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f32(float32x4_t __p0) { 37964 int8x16_t __ret; 37965 __ret = (int8x16_t)(__p0); 37966 return __ret; 37967 } 37968 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f16(float16x8_t __p0) { 37969 int8x16_t __ret; 37970 __ret = (int8x16_t)(__p0); 37971 return __ret; 37972 } 37973 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s32(int32x4_t __p0) { 37974 int8x16_t __ret; 37975 __ret = (int8x16_t)(__p0); 37976 return __ret; 37977 } 37978 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s64(int64x2_t __p0) { 37979 int8x16_t __ret; 37980 __ret = (int8x16_t)(__p0); 37981 return __ret; 37982 } 37983 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s16(int16x8_t __p0) { 37984 int8x16_t __ret; 37985 __ret = (int8x16_t)(__p0); 37986 return __ret; 37987 } 37988 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p8(poly8x16_t __p0) { 37989 float32x4_t __ret; 37990 __ret = (float32x4_t)(__p0); 37991 return __ret; 37992 } 37993 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p16(poly16x8_t __p0) { 37994 float32x4_t __ret; 37995 __ret = (float32x4_t)(__p0); 37996 return __ret; 37997 } 37998 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u8(uint8x16_t __p0) { 37999 float32x4_t __ret; 38000 __ret = (float32x4_t)(__p0); 38001 return __ret; 38002 } 38003 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u32(uint32x4_t __p0) { 38004 float32x4_t __ret; 38005 __ret = (float32x4_t)(__p0); 38006 return __ret; 38007 } 38008 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u64(uint64x2_t __p0) { 38009 float32x4_t __ret; 38010 __ret = (float32x4_t)(__p0); 38011 return __ret; 38012 } 38013 __ai __attribute__((target("neon"))) float32x4_t 
vreinterpretq_f32_u16(uint16x8_t __p0) { 38014 float32x4_t __ret; 38015 __ret = (float32x4_t)(__p0); 38016 return __ret; 38017 } 38018 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s8(int8x16_t __p0) { 38019 float32x4_t __ret; 38020 __ret = (float32x4_t)(__p0); 38021 return __ret; 38022 } 38023 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_f16(float16x8_t __p0) { 38024 float32x4_t __ret; 38025 __ret = (float32x4_t)(__p0); 38026 return __ret; 38027 } 38028 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s32(int32x4_t __p0) { 38029 float32x4_t __ret; 38030 __ret = (float32x4_t)(__p0); 38031 return __ret; 38032 } 38033 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s64(int64x2_t __p0) { 38034 float32x4_t __ret; 38035 __ret = (float32x4_t)(__p0); 38036 return __ret; 38037 } 38038 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s16(int16x8_t __p0) { 38039 float32x4_t __ret; 38040 __ret = (float32x4_t)(__p0); 38041 return __ret; 38042 } 38043 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p8(poly8x16_t __p0) { 38044 float16x8_t __ret; 38045 __ret = (float16x8_t)(__p0); 38046 return __ret; 38047 } 38048 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p16(poly16x8_t __p0) { 38049 float16x8_t __ret; 38050 __ret = (float16x8_t)(__p0); 38051 return __ret; 38052 } 38053 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u8(uint8x16_t __p0) { 38054 float16x8_t __ret; 38055 __ret = (float16x8_t)(__p0); 38056 return __ret; 38057 } 38058 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u32(uint32x4_t __p0) { 38059 float16x8_t __ret; 38060 __ret = (float16x8_t)(__p0); 38061 return __ret; 38062 } 38063 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u64(uint64x2_t __p0) { 38064 float16x8_t __ret; 38065 __ret = (float16x8_t)(__p0); 38066 return __ret; 38067 } 38068 __ai 
__attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u16(uint16x8_t __p0) { 38069 float16x8_t __ret; 38070 __ret = (float16x8_t)(__p0); 38071 return __ret; 38072 } 38073 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s8(int8x16_t __p0) { 38074 float16x8_t __ret; 38075 __ret = (float16x8_t)(__p0); 38076 return __ret; 38077 } 38078 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_f32(float32x4_t __p0) { 38079 float16x8_t __ret; 38080 __ret = (float16x8_t)(__p0); 38081 return __ret; 38082 } 38083 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s32(int32x4_t __p0) { 38084 float16x8_t __ret; 38085 __ret = (float16x8_t)(__p0); 38086 return __ret; 38087 } 38088 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s64(int64x2_t __p0) { 38089 float16x8_t __ret; 38090 __ret = (float16x8_t)(__p0); 38091 return __ret; 38092 } 38093 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s16(int16x8_t __p0) { 38094 float16x8_t __ret; 38095 __ret = (float16x8_t)(__p0); 38096 return __ret; 38097 } 38098 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p8(poly8x16_t __p0) { 38099 int32x4_t __ret; 38100 __ret = (int32x4_t)(__p0); 38101 return __ret; 38102 } 38103 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p16(poly16x8_t __p0) { 38104 int32x4_t __ret; 38105 __ret = (int32x4_t)(__p0); 38106 return __ret; 38107 } 38108 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u8(uint8x16_t __p0) { 38109 int32x4_t __ret; 38110 __ret = (int32x4_t)(__p0); 38111 return __ret; 38112 } 38113 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u32(uint32x4_t __p0) { 38114 int32x4_t __ret; 38115 __ret = (int32x4_t)(__p0); 38116 return __ret; 38117 } 38118 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u64(uint64x2_t __p0) { 38119 int32x4_t __ret; 38120 __ret = (int32x4_t)(__p0); 38121 return __ret; 38122 } 38123 __ai 
__attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u16(uint16x8_t __p0) { 38124 int32x4_t __ret; 38125 __ret = (int32x4_t)(__p0); 38126 return __ret; 38127 } 38128 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s8(int8x16_t __p0) { 38129 int32x4_t __ret; 38130 __ret = (int32x4_t)(__p0); 38131 return __ret; 38132 } 38133 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f32(float32x4_t __p0) { 38134 int32x4_t __ret; 38135 __ret = (int32x4_t)(__p0); 38136 return __ret; 38137 } 38138 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f16(float16x8_t __p0) { 38139 int32x4_t __ret; 38140 __ret = (int32x4_t)(__p0); 38141 return __ret; 38142 } 38143 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s64(int64x2_t __p0) { 38144 int32x4_t __ret; 38145 __ret = (int32x4_t)(__p0); 38146 return __ret; 38147 } 38148 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s16(int16x8_t __p0) { 38149 int32x4_t __ret; 38150 __ret = (int32x4_t)(__p0); 38151 return __ret; 38152 } 38153 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p8(poly8x16_t __p0) { 38154 int64x2_t __ret; 38155 __ret = (int64x2_t)(__p0); 38156 return __ret; 38157 } 38158 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p16(poly16x8_t __p0) { 38159 int64x2_t __ret; 38160 __ret = (int64x2_t)(__p0); 38161 return __ret; 38162 } 38163 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u8(uint8x16_t __p0) { 38164 int64x2_t __ret; 38165 __ret = (int64x2_t)(__p0); 38166 return __ret; 38167 } 38168 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u32(uint32x4_t __p0) { 38169 int64x2_t __ret; 38170 __ret = (int64x2_t)(__p0); 38171 return __ret; 38172 } 38173 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u64(uint64x2_t __p0) { 38174 int64x2_t __ret; 38175 __ret = (int64x2_t)(__p0); 38176 return __ret; 38177 } 38178 __ai __attribute__((target("neon"))) int64x2_t 
vreinterpretq_s64_u16(uint16x8_t __p0) { 38179 int64x2_t __ret; 38180 __ret = (int64x2_t)(__p0); 38181 return __ret; 38182 } 38183 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s8(int8x16_t __p0) { 38184 int64x2_t __ret; 38185 __ret = (int64x2_t)(__p0); 38186 return __ret; 38187 } 38188 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f32(float32x4_t __p0) { 38189 int64x2_t __ret; 38190 __ret = (int64x2_t)(__p0); 38191 return __ret; 38192 } 38193 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f16(float16x8_t __p0) { 38194 int64x2_t __ret; 38195 __ret = (int64x2_t)(__p0); 38196 return __ret; 38197 } 38198 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s32(int32x4_t __p0) { 38199 int64x2_t __ret; 38200 __ret = (int64x2_t)(__p0); 38201 return __ret; 38202 } 38203 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s16(int16x8_t __p0) { 38204 int64x2_t __ret; 38205 __ret = (int64x2_t)(__p0); 38206 return __ret; 38207 } 38208 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p8(poly8x16_t __p0) { 38209 int16x8_t __ret; 38210 __ret = (int16x8_t)(__p0); 38211 return __ret; 38212 } 38213 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p16(poly16x8_t __p0) { 38214 int16x8_t __ret; 38215 __ret = (int16x8_t)(__p0); 38216 return __ret; 38217 } 38218 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u8(uint8x16_t __p0) { 38219 int16x8_t __ret; 38220 __ret = (int16x8_t)(__p0); 38221 return __ret; 38222 } 38223 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u32(uint32x4_t __p0) { 38224 int16x8_t __ret; 38225 __ret = (int16x8_t)(__p0); 38226 return __ret; 38227 } 38228 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u64(uint64x2_t __p0) { 38229 int16x8_t __ret; 38230 __ret = (int16x8_t)(__p0); 38231 return __ret; 38232 } 38233 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u16(uint16x8_t __p0) { 
38234 int16x8_t __ret; 38235 __ret = (int16x8_t)(__p0); 38236 return __ret; 38237 } 38238 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s8(int8x16_t __p0) { 38239 int16x8_t __ret; 38240 __ret = (int16x8_t)(__p0); 38241 return __ret; 38242 } 38243 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f32(float32x4_t __p0) { 38244 int16x8_t __ret; 38245 __ret = (int16x8_t)(__p0); 38246 return __ret; 38247 } 38248 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f16(float16x8_t __p0) { 38249 int16x8_t __ret; 38250 __ret = (int16x8_t)(__p0); 38251 return __ret; 38252 } 38253 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s32(int32x4_t __p0) { 38254 int16x8_t __ret; 38255 __ret = (int16x8_t)(__p0); 38256 return __ret; 38257 } 38258 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s64(int64x2_t __p0) { 38259 int16x8_t __ret; 38260 __ret = (int16x8_t)(__p0); 38261 return __ret; 38262 } 38263 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p8(poly8x8_t __p0) { 38264 uint8x8_t __ret; 38265 __ret = (uint8x8_t)(__p0); 38266 return __ret; 38267 } 38268 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p16(poly16x4_t __p0) { 38269 uint8x8_t __ret; 38270 __ret = (uint8x8_t)(__p0); 38271 return __ret; 38272 } 38273 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u32(uint32x2_t __p0) { 38274 uint8x8_t __ret; 38275 __ret = (uint8x8_t)(__p0); 38276 return __ret; 38277 } 38278 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u64(uint64x1_t __p0) { 38279 uint8x8_t __ret; 38280 __ret = (uint8x8_t)(__p0); 38281 return __ret; 38282 } 38283 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u16(uint16x4_t __p0) { 38284 uint8x8_t __ret; 38285 __ret = (uint8x8_t)(__p0); 38286 return __ret; 38287 } 38288 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s8(int8x8_t __p0) { 38289 uint8x8_t __ret; 38290 __ret = (uint8x8_t)(__p0); 
38291 return __ret; 38292 } 38293 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f32(float32x2_t __p0) { 38294 uint8x8_t __ret; 38295 __ret = (uint8x8_t)(__p0); 38296 return __ret; 38297 } 38298 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f16(float16x4_t __p0) { 38299 uint8x8_t __ret; 38300 __ret = (uint8x8_t)(__p0); 38301 return __ret; 38302 } 38303 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s32(int32x2_t __p0) { 38304 uint8x8_t __ret; 38305 __ret = (uint8x8_t)(__p0); 38306 return __ret; 38307 } 38308 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s64(int64x1_t __p0) { 38309 uint8x8_t __ret; 38310 __ret = (uint8x8_t)(__p0); 38311 return __ret; 38312 } 38313 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s16(int16x4_t __p0) { 38314 uint8x8_t __ret; 38315 __ret = (uint8x8_t)(__p0); 38316 return __ret; 38317 } 38318 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p8(poly8x8_t __p0) { 38319 uint32x2_t __ret; 38320 __ret = (uint32x2_t)(__p0); 38321 return __ret; 38322 } 38323 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p16(poly16x4_t __p0) { 38324 uint32x2_t __ret; 38325 __ret = (uint32x2_t)(__p0); 38326 return __ret; 38327 } 38328 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u8(uint8x8_t __p0) { 38329 uint32x2_t __ret; 38330 __ret = (uint32x2_t)(__p0); 38331 return __ret; 38332 } 38333 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u64(uint64x1_t __p0) { 38334 uint32x2_t __ret; 38335 __ret = (uint32x2_t)(__p0); 38336 return __ret; 38337 } 38338 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u16(uint16x4_t __p0) { 38339 uint32x2_t __ret; 38340 __ret = (uint32x2_t)(__p0); 38341 return __ret; 38342 } 38343 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s8(int8x8_t __p0) { 38344 uint32x2_t __ret; 38345 __ret = (uint32x2_t)(__p0); 38346 return __ret; 38347 } 38348 __ai 
__attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f32(float32x2_t __p0) { 38349 uint32x2_t __ret; 38350 __ret = (uint32x2_t)(__p0); 38351 return __ret; 38352 } 38353 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f16(float16x4_t __p0) { 38354 uint32x2_t __ret; 38355 __ret = (uint32x2_t)(__p0); 38356 return __ret; 38357 } 38358 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s32(int32x2_t __p0) { 38359 uint32x2_t __ret; 38360 __ret = (uint32x2_t)(__p0); 38361 return __ret; 38362 } 38363 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s64(int64x1_t __p0) { 38364 uint32x2_t __ret; 38365 __ret = (uint32x2_t)(__p0); 38366 return __ret; 38367 } 38368 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s16(int16x4_t __p0) { 38369 uint32x2_t __ret; 38370 __ret = (uint32x2_t)(__p0); 38371 return __ret; 38372 } 38373 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p8(poly8x8_t __p0) { 38374 uint64x1_t __ret; 38375 __ret = (uint64x1_t)(__p0); 38376 return __ret; 38377 } 38378 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p16(poly16x4_t __p0) { 38379 uint64x1_t __ret; 38380 __ret = (uint64x1_t)(__p0); 38381 return __ret; 38382 } 38383 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u8(uint8x8_t __p0) { 38384 uint64x1_t __ret; 38385 __ret = (uint64x1_t)(__p0); 38386 return __ret; 38387 } 38388 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u32(uint32x2_t __p0) { 38389 uint64x1_t __ret; 38390 __ret = (uint64x1_t)(__p0); 38391 return __ret; 38392 } 38393 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u16(uint16x4_t __p0) { 38394 uint64x1_t __ret; 38395 __ret = (uint64x1_t)(__p0); 38396 return __ret; 38397 } 38398 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s8(int8x8_t __p0) { 38399 uint64x1_t __ret; 38400 __ret = (uint64x1_t)(__p0); 38401 return __ret; 38402 } 38403 __ai 
__attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f32(float32x2_t __p0) { 38404 uint64x1_t __ret; 38405 __ret = (uint64x1_t)(__p0); 38406 return __ret; 38407 } 38408 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f16(float16x4_t __p0) { 38409 uint64x1_t __ret; 38410 __ret = (uint64x1_t)(__p0); 38411 return __ret; 38412 } 38413 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s32(int32x2_t __p0) { 38414 uint64x1_t __ret; 38415 __ret = (uint64x1_t)(__p0); 38416 return __ret; 38417 } 38418 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s64(int64x1_t __p0) { 38419 uint64x1_t __ret; 38420 __ret = (uint64x1_t)(__p0); 38421 return __ret; 38422 } 38423 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s16(int16x4_t __p0) { 38424 uint64x1_t __ret; 38425 __ret = (uint64x1_t)(__p0); 38426 return __ret; 38427 } 38428 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p8(poly8x8_t __p0) { 38429 uint16x4_t __ret; 38430 __ret = (uint16x4_t)(__p0); 38431 return __ret; 38432 } 38433 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p16(poly16x4_t __p0) { 38434 uint16x4_t __ret; 38435 __ret = (uint16x4_t)(__p0); 38436 return __ret; 38437 } 38438 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u8(uint8x8_t __p0) { 38439 uint16x4_t __ret; 38440 __ret = (uint16x4_t)(__p0); 38441 return __ret; 38442 } 38443 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u32(uint32x2_t __p0) { 38444 uint16x4_t __ret; 38445 __ret = (uint16x4_t)(__p0); 38446 return __ret; 38447 } 38448 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u64(uint64x1_t __p0) { 38449 uint16x4_t __ret; 38450 __ret = (uint16x4_t)(__p0); 38451 return __ret; 38452 } 38453 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s8(int8x8_t __p0) { 38454 uint16x4_t __ret; 38455 __ret = (uint16x4_t)(__p0); 38456 return __ret; 38457 } 38458 __ai 
__attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f32(float32x2_t __p0) { 38459 uint16x4_t __ret; 38460 __ret = (uint16x4_t)(__p0); 38461 return __ret; 38462 } 38463 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f16(float16x4_t __p0) { 38464 uint16x4_t __ret; 38465 __ret = (uint16x4_t)(__p0); 38466 return __ret; 38467 } 38468 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s32(int32x2_t __p0) { 38469 uint16x4_t __ret; 38470 __ret = (uint16x4_t)(__p0); 38471 return __ret; 38472 } 38473 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s64(int64x1_t __p0) { 38474 uint16x4_t __ret; 38475 __ret = (uint16x4_t)(__p0); 38476 return __ret; 38477 } 38478 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s16(int16x4_t __p0) { 38479 uint16x4_t __ret; 38480 __ret = (uint16x4_t)(__p0); 38481 return __ret; 38482 } 38483 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p8(poly8x8_t __p0) { 38484 int8x8_t __ret; 38485 __ret = (int8x8_t)(__p0); 38486 return __ret; 38487 } 38488 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p16(poly16x4_t __p0) { 38489 int8x8_t __ret; 38490 __ret = (int8x8_t)(__p0); 38491 return __ret; 38492 } 38493 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u8(uint8x8_t __p0) { 38494 int8x8_t __ret; 38495 __ret = (int8x8_t)(__p0); 38496 return __ret; 38497 } 38498 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u32(uint32x2_t __p0) { 38499 int8x8_t __ret; 38500 __ret = (int8x8_t)(__p0); 38501 return __ret; 38502 } 38503 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u64(uint64x1_t __p0) { 38504 int8x8_t __ret; 38505 __ret = (int8x8_t)(__p0); 38506 return __ret; 38507 } 38508 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u16(uint16x4_t __p0) { 38509 int8x8_t __ret; 38510 __ret = (int8x8_t)(__p0); 38511 return __ret; 38512 } 38513 __ai __attribute__((target("neon"))) int8x8_t 
vreinterpret_s8_f32(float32x2_t __p0) { 38514 int8x8_t __ret; 38515 __ret = (int8x8_t)(__p0); 38516 return __ret; 38517 } 38518 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f16(float16x4_t __p0) { 38519 int8x8_t __ret; 38520 __ret = (int8x8_t)(__p0); 38521 return __ret; 38522 } 38523 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s32(int32x2_t __p0) { 38524 int8x8_t __ret; 38525 __ret = (int8x8_t)(__p0); 38526 return __ret; 38527 } 38528 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s64(int64x1_t __p0) { 38529 int8x8_t __ret; 38530 __ret = (int8x8_t)(__p0); 38531 return __ret; 38532 } 38533 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s16(int16x4_t __p0) { 38534 int8x8_t __ret; 38535 __ret = (int8x8_t)(__p0); 38536 return __ret; 38537 } 38538 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p8(poly8x8_t __p0) { 38539 float32x2_t __ret; 38540 __ret = (float32x2_t)(__p0); 38541 return __ret; 38542 } 38543 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p16(poly16x4_t __p0) { 38544 float32x2_t __ret; 38545 __ret = (float32x2_t)(__p0); 38546 return __ret; 38547 } 38548 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u8(uint8x8_t __p0) { 38549 float32x2_t __ret; 38550 __ret = (float32x2_t)(__p0); 38551 return __ret; 38552 } 38553 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u32(uint32x2_t __p0) { 38554 float32x2_t __ret; 38555 __ret = (float32x2_t)(__p0); 38556 return __ret; 38557 } 38558 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u64(uint64x1_t __p0) { 38559 float32x2_t __ret; 38560 __ret = (float32x2_t)(__p0); 38561 return __ret; 38562 } 38563 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u16(uint16x4_t __p0) { 38564 float32x2_t __ret; 38565 __ret = (float32x2_t)(__p0); 38566 return __ret; 38567 } 38568 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s8(int8x8_t __p0) { 
38569 float32x2_t __ret; 38570 __ret = (float32x2_t)(__p0); 38571 return __ret; 38572 } 38573 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_f16(float16x4_t __p0) { 38574 float32x2_t __ret; 38575 __ret = (float32x2_t)(__p0); 38576 return __ret; 38577 } 38578 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s32(int32x2_t __p0) { 38579 float32x2_t __ret; 38580 __ret = (float32x2_t)(__p0); 38581 return __ret; 38582 } 38583 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s64(int64x1_t __p0) { 38584 float32x2_t __ret; 38585 __ret = (float32x2_t)(__p0); 38586 return __ret; 38587 } 38588 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s16(int16x4_t __p0) { 38589 float32x2_t __ret; 38590 __ret = (float32x2_t)(__p0); 38591 return __ret; 38592 } 38593 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p8(poly8x8_t __p0) { 38594 float16x4_t __ret; 38595 __ret = (float16x4_t)(__p0); 38596 return __ret; 38597 } 38598 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p16(poly16x4_t __p0) { 38599 float16x4_t __ret; 38600 __ret = (float16x4_t)(__p0); 38601 return __ret; 38602 } 38603 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u8(uint8x8_t __p0) { 38604 float16x4_t __ret; 38605 __ret = (float16x4_t)(__p0); 38606 return __ret; 38607 } 38608 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u32(uint32x2_t __p0) { 38609 float16x4_t __ret; 38610 __ret = (float16x4_t)(__p0); 38611 return __ret; 38612 } 38613 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u64(uint64x1_t __p0) { 38614 float16x4_t __ret; 38615 __ret = (float16x4_t)(__p0); 38616 return __ret; 38617 } 38618 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u16(uint16x4_t __p0) { 38619 float16x4_t __ret; 38620 __ret = (float16x4_t)(__p0); 38621 return __ret; 38622 } 38623 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s8(int8x8_t 
__p0) { 38624 float16x4_t __ret; 38625 __ret = (float16x4_t)(__p0); 38626 return __ret; 38627 } 38628 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_f32(float32x2_t __p0) { 38629 float16x4_t __ret; 38630 __ret = (float16x4_t)(__p0); 38631 return __ret; 38632 } 38633 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s32(int32x2_t __p0) { 38634 float16x4_t __ret; 38635 __ret = (float16x4_t)(__p0); 38636 return __ret; 38637 } 38638 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s64(int64x1_t __p0) { 38639 float16x4_t __ret; 38640 __ret = (float16x4_t)(__p0); 38641 return __ret; 38642 } 38643 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s16(int16x4_t __p0) { 38644 float16x4_t __ret; 38645 __ret = (float16x4_t)(__p0); 38646 return __ret; 38647 } 38648 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p8(poly8x8_t __p0) { 38649 int32x2_t __ret; 38650 __ret = (int32x2_t)(__p0); 38651 return __ret; 38652 } 38653 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p16(poly16x4_t __p0) { 38654 int32x2_t __ret; 38655 __ret = (int32x2_t)(__p0); 38656 return __ret; 38657 } 38658 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u8(uint8x8_t __p0) { 38659 int32x2_t __ret; 38660 __ret = (int32x2_t)(__p0); 38661 return __ret; 38662 } 38663 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u32(uint32x2_t __p0) { 38664 int32x2_t __ret; 38665 __ret = (int32x2_t)(__p0); 38666 return __ret; 38667 } 38668 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u64(uint64x1_t __p0) { 38669 int32x2_t __ret; 38670 __ret = (int32x2_t)(__p0); 38671 return __ret; 38672 } 38673 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u16(uint16x4_t __p0) { 38674 int32x2_t __ret; 38675 __ret = (int32x2_t)(__p0); 38676 return __ret; 38677 } 38678 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s8(int8x8_t __p0) { 38679 int32x2_t __ret; 
38680 __ret = (int32x2_t)(__p0); 38681 return __ret; 38682 } 38683 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f32(float32x2_t __p0) { 38684 int32x2_t __ret; 38685 __ret = (int32x2_t)(__p0); 38686 return __ret; 38687 } 38688 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f16(float16x4_t __p0) { 38689 int32x2_t __ret; 38690 __ret = (int32x2_t)(__p0); 38691 return __ret; 38692 } 38693 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s64(int64x1_t __p0) { 38694 int32x2_t __ret; 38695 __ret = (int32x2_t)(__p0); 38696 return __ret; 38697 } 38698 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s16(int16x4_t __p0) { 38699 int32x2_t __ret; 38700 __ret = (int32x2_t)(__p0); 38701 return __ret; 38702 } 38703 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p8(poly8x8_t __p0) { 38704 int64x1_t __ret; 38705 __ret = (int64x1_t)(__p0); 38706 return __ret; 38707 } 38708 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p16(poly16x4_t __p0) { 38709 int64x1_t __ret; 38710 __ret = (int64x1_t)(__p0); 38711 return __ret; 38712 } 38713 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u8(uint8x8_t __p0) { 38714 int64x1_t __ret; 38715 __ret = (int64x1_t)(__p0); 38716 return __ret; 38717 } 38718 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u32(uint32x2_t __p0) { 38719 int64x1_t __ret; 38720 __ret = (int64x1_t)(__p0); 38721 return __ret; 38722 } 38723 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u64(uint64x1_t __p0) { 38724 int64x1_t __ret; 38725 __ret = (int64x1_t)(__p0); 38726 return __ret; 38727 } 38728 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u16(uint16x4_t __p0) { 38729 int64x1_t __ret; 38730 __ret = (int64x1_t)(__p0); 38731 return __ret; 38732 } 38733 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s8(int8x8_t __p0) { 38734 int64x1_t __ret; 38735 __ret = (int64x1_t)(__p0); 38736 return __ret; 38737 
} 38738 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f32(float32x2_t __p0) { 38739 int64x1_t __ret; 38740 __ret = (int64x1_t)(__p0); 38741 return __ret; 38742 } 38743 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f16(float16x4_t __p0) { 38744 int64x1_t __ret; 38745 __ret = (int64x1_t)(__p0); 38746 return __ret; 38747 } 38748 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s32(int32x2_t __p0) { 38749 int64x1_t __ret; 38750 __ret = (int64x1_t)(__p0); 38751 return __ret; 38752 } 38753 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s16(int16x4_t __p0) { 38754 int64x1_t __ret; 38755 __ret = (int64x1_t)(__p0); 38756 return __ret; 38757 } 38758 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p8(poly8x8_t __p0) { 38759 int16x4_t __ret; 38760 __ret = (int16x4_t)(__p0); 38761 return __ret; 38762 } 38763 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p16(poly16x4_t __p0) { 38764 int16x4_t __ret; 38765 __ret = (int16x4_t)(__p0); 38766 return __ret; 38767 } 38768 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u8(uint8x8_t __p0) { 38769 int16x4_t __ret; 38770 __ret = (int16x4_t)(__p0); 38771 return __ret; 38772 } 38773 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u32(uint32x2_t __p0) { 38774 int16x4_t __ret; 38775 __ret = (int16x4_t)(__p0); 38776 return __ret; 38777 } 38778 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u64(uint64x1_t __p0) { 38779 int16x4_t __ret; 38780 __ret = (int16x4_t)(__p0); 38781 return __ret; 38782 } 38783 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u16(uint16x4_t __p0) { 38784 int16x4_t __ret; 38785 __ret = (int16x4_t)(__p0); 38786 return __ret; 38787 } 38788 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s8(int8x8_t __p0) { 38789 int16x4_t __ret; 38790 __ret = (int16x4_t)(__p0); 38791 return __ret; 38792 } 38793 __ai __attribute__((target("neon"))) int16x4_t 
vreinterpret_s16_f32(float32x2_t __p0) { 38794 int16x4_t __ret; 38795 __ret = (int16x4_t)(__p0); 38796 return __ret; 38797 } 38798 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_f16(float16x4_t __p0) { 38799 int16x4_t __ret; 38800 __ret = (int16x4_t)(__p0); 38801 return __ret; 38802 } 38803 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s32(int32x2_t __p0) { 38804 int16x4_t __ret; 38805 __ret = (int16x4_t)(__p0); 38806 return __ret; 38807 } 38808 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s64(int64x1_t __p0) { 38809 int16x4_t __ret; 38810 __ret = (int16x4_t)(__p0); 38811 return __ret; 38812 } 38813 #endif 38814 #if (__ARM_FP & 2) 38815 #ifdef __LITTLE_ENDIAN__ 38816 __ai __attribute__((target("neon"))) float16x4_t vcvt_f16_f32(float32x4_t __p0) { 38817 float16x4_t __ret; 38818 __ret = (float16x4_t) __builtin_neon_vcvt_f16_f32((int8x16_t)__p0, 41); 38819 return __ret; 38820 } 38821 #else 38822 __ai __attribute__((target("neon"))) float16x4_t vcvt_f16_f32(float32x4_t __p0) { 38823 float16x4_t __ret; 38824 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 38825 __ret = (float16x4_t) __builtin_neon_vcvt_f16_f32((int8x16_t)__rev0, 41); 38826 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 38827 return __ret; 38828 } 38829 __ai __attribute__((target("neon"))) float16x4_t __noswap_vcvt_f16_f32(float32x4_t __p0) { 38830 float16x4_t __ret; 38831 __ret = (float16x4_t) __builtin_neon_vcvt_f16_f32((int8x16_t)__p0, 41); 38832 return __ret; 38833 } 38834 #endif 38835 38836 #ifdef __LITTLE_ENDIAN__ 38837 __ai __attribute__((target("neon"))) float32x4_t vcvt_f32_f16(float16x4_t __p0) { 38838 float32x4_t __ret; 38839 __ret = (float32x4_t) __builtin_neon_vcvt_f32_f16((int8x8_t)__p0, 8); 38840 return __ret; 38841 } 38842 #else 38843 __ai __attribute__((target("neon"))) float32x4_t vcvt_f32_f16(float16x4_t __p0) { 38844 float32x4_t __ret; 38845 float16x4_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 38846 __ret = (float32x4_t) __builtin_neon_vcvt_f32_f16((int8x8_t)__rev0, 8); 38847 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 38848 return __ret; 38849 } 38850 __ai __attribute__((target("neon"))) float32x4_t __noswap_vcvt_f32_f16(float16x4_t __p0) { 38851 float32x4_t __ret; 38852 __ret = (float32x4_t) __builtin_neon_vcvt_f32_f16((int8x8_t)__p0, 8); 38853 return __ret; 38854 } 38855 #endif 38856 38857 #ifdef __LITTLE_ENDIAN__ 38858 #define vld1q_f16(__p0) __extension__ ({ \ 38859 float16x8_t __ret; \ 38860 __ret = (float16x8_t) __builtin_neon_vld1q_v(__p0, 40); \ 38861 __ret; \ 38862 }) 38863 #else 38864 #define vld1q_f16(__p0) __extension__ ({ \ 38865 float16x8_t __ret; \ 38866 __ret = (float16x8_t) __builtin_neon_vld1q_v(__p0, 40); \ 38867 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 38868 __ret; \ 38869 }) 38870 #endif 38871 38872 #ifdef __LITTLE_ENDIAN__ 38873 #define vld1_f16(__p0) __extension__ ({ \ 38874 float16x4_t __ret; \ 38875 __ret = (float16x4_t) __builtin_neon_vld1_v(__p0, 8); \ 38876 __ret; \ 38877 }) 38878 #else 38879 #define vld1_f16(__p0) __extension__ ({ \ 38880 float16x4_t __ret; \ 38881 __ret = (float16x4_t) __builtin_neon_vld1_v(__p0, 8); \ 38882 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 38883 __ret; \ 38884 }) 38885 #endif 38886 38887 #ifdef __LITTLE_ENDIAN__ 38888 #define vld1q_dup_f16(__p0) __extension__ ({ \ 38889 float16x8_t __ret; \ 38890 __ret = (float16x8_t) __builtin_neon_vld1q_dup_v(__p0, 40); \ 38891 __ret; \ 38892 }) 38893 #else 38894 #define vld1q_dup_f16(__p0) __extension__ ({ \ 38895 float16x8_t __ret; \ 38896 __ret = (float16x8_t) __builtin_neon_vld1q_dup_v(__p0, 40); \ 38897 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 38898 __ret; \ 38899 }) 38900 #endif 38901 38902 #ifdef __LITTLE_ENDIAN__ 38903 #define vld1_dup_f16(__p0) __extension__ ({ \ 38904 float16x4_t __ret; \ 38905 __ret = 
(float16x4_t) __builtin_neon_vld1_dup_v(__p0, 8); \ 38906 __ret; \ 38907 }) 38908 #else 38909 #define vld1_dup_f16(__p0) __extension__ ({ \ 38910 float16x4_t __ret; \ 38911 __ret = (float16x4_t) __builtin_neon_vld1_dup_v(__p0, 8); \ 38912 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 38913 __ret; \ 38914 }) 38915 #endif 38916 38917 #ifdef __LITTLE_ENDIAN__ 38918 #define vld1q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 38919 float16x8_t __ret; \ 38920 float16x8_t __s1 = __p1; \ 38921 __ret = (float16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 40); \ 38922 __ret; \ 38923 }) 38924 #else 38925 #define vld1q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 38926 float16x8_t __ret; \ 38927 float16x8_t __s1 = __p1; \ 38928 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 38929 __ret = (float16x8_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 40); \ 38930 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 38931 __ret; \ 38932 }) 38933 #endif 38934 38935 #ifdef __LITTLE_ENDIAN__ 38936 #define vld1_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 38937 float16x4_t __ret; \ 38938 float16x4_t __s1 = __p1; \ 38939 __ret = (float16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 8); \ 38940 __ret; \ 38941 }) 38942 #else 38943 #define vld1_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 38944 float16x4_t __ret; \ 38945 float16x4_t __s1 = __p1; \ 38946 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 38947 __ret = (float16x4_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__rev1, __p2, 8); \ 38948 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 38949 __ret; \ 38950 }) 38951 #endif 38952 38953 #ifdef __LITTLE_ENDIAN__ 38954 #define vld1q_f16_x2(__p0) __extension__ ({ \ 38955 float16x8x2_t __ret; \ 38956 __builtin_neon_vld1q_x2_v(&__ret, __p0, 40); \ 38957 __ret; \ 38958 }) 38959 #else 38960 #define vld1q_f16_x2(__p0) 
__extension__ ({ \ 38961 float16x8x2_t __ret; \ 38962 __builtin_neon_vld1q_x2_v(&__ret, __p0, 40); \ 38963 \ 38964 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 38965 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 38966 __ret; \ 38967 }) 38968 #endif 38969 38970 #ifdef __LITTLE_ENDIAN__ 38971 #define vld1_f16_x2(__p0) __extension__ ({ \ 38972 float16x4x2_t __ret; \ 38973 __builtin_neon_vld1_x2_v(&__ret, __p0, 8); \ 38974 __ret; \ 38975 }) 38976 #else 38977 #define vld1_f16_x2(__p0) __extension__ ({ \ 38978 float16x4x2_t __ret; \ 38979 __builtin_neon_vld1_x2_v(&__ret, __p0, 8); \ 38980 \ 38981 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 38982 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 38983 __ret; \ 38984 }) 38985 #endif 38986 38987 #ifdef __LITTLE_ENDIAN__ 38988 #define vld1q_f16_x3(__p0) __extension__ ({ \ 38989 float16x8x3_t __ret; \ 38990 __builtin_neon_vld1q_x3_v(&__ret, __p0, 40); \ 38991 __ret; \ 38992 }) 38993 #else 38994 #define vld1q_f16_x3(__p0) __extension__ ({ \ 38995 float16x8x3_t __ret; \ 38996 __builtin_neon_vld1q_x3_v(&__ret, __p0, 40); \ 38997 \ 38998 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 38999 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39000 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39001 __ret; \ 39002 }) 39003 #endif 39004 39005 #ifdef __LITTLE_ENDIAN__ 39006 #define vld1_f16_x3(__p0) __extension__ ({ \ 39007 float16x4x3_t __ret; \ 39008 __builtin_neon_vld1_x3_v(&__ret, __p0, 8); \ 39009 __ret; \ 39010 }) 39011 #else 39012 #define vld1_f16_x3(__p0) __extension__ ({ \ 39013 float16x4x3_t __ret; \ 39014 __builtin_neon_vld1_x3_v(&__ret, __p0, 8); \ 39015 \ 39016 __ret.val[0] = __builtin_shufflevector(__ret.val[0], 
__ret.val[0], 3, 2, 1, 0); \ 39017 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39018 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 39019 __ret; \ 39020 }) 39021 #endif 39022 39023 #ifdef __LITTLE_ENDIAN__ 39024 #define vld1q_f16_x4(__p0) __extension__ ({ \ 39025 float16x8x4_t __ret; \ 39026 __builtin_neon_vld1q_x4_v(&__ret, __p0, 40); \ 39027 __ret; \ 39028 }) 39029 #else 39030 #define vld1q_f16_x4(__p0) __extension__ ({ \ 39031 float16x8x4_t __ret; \ 39032 __builtin_neon_vld1q_x4_v(&__ret, __p0, 40); \ 39033 \ 39034 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39035 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39036 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39037 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 39038 __ret; \ 39039 }) 39040 #endif 39041 39042 #ifdef __LITTLE_ENDIAN__ 39043 #define vld1_f16_x4(__p0) __extension__ ({ \ 39044 float16x4x4_t __ret; \ 39045 __builtin_neon_vld1_x4_v(&__ret, __p0, 8); \ 39046 __ret; \ 39047 }) 39048 #else 39049 #define vld1_f16_x4(__p0) __extension__ ({ \ 39050 float16x4x4_t __ret; \ 39051 __builtin_neon_vld1_x4_v(&__ret, __p0, 8); \ 39052 \ 39053 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39054 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39055 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 39056 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 39057 __ret; \ 39058 }) 39059 #endif 39060 39061 #ifdef __LITTLE_ENDIAN__ 39062 #define vld2q_f16(__p0) __extension__ ({ \ 39063 float16x8x2_t __ret; \ 39064 __builtin_neon_vld2q_v(&__ret, __p0, 40); \ 39065 __ret; \ 39066 }) 39067 #else 39068 #define vld2q_f16(__p0) 
__extension__ ({ \ 39069 float16x8x2_t __ret; \ 39070 __builtin_neon_vld2q_v(&__ret, __p0, 40); \ 39071 \ 39072 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39073 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39074 __ret; \ 39075 }) 39076 #endif 39077 39078 #ifdef __LITTLE_ENDIAN__ 39079 #define vld2_f16(__p0) __extension__ ({ \ 39080 float16x4x2_t __ret; \ 39081 __builtin_neon_vld2_v(&__ret, __p0, 8); \ 39082 __ret; \ 39083 }) 39084 #else 39085 #define vld2_f16(__p0) __extension__ ({ \ 39086 float16x4x2_t __ret; \ 39087 __builtin_neon_vld2_v(&__ret, __p0, 8); \ 39088 \ 39089 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39090 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39091 __ret; \ 39092 }) 39093 #endif 39094 39095 #ifdef __LITTLE_ENDIAN__ 39096 #define vld2q_dup_f16(__p0) __extension__ ({ \ 39097 float16x8x2_t __ret; \ 39098 __builtin_neon_vld2q_dup_v(&__ret, __p0, 40); \ 39099 __ret; \ 39100 }) 39101 #else 39102 #define vld2q_dup_f16(__p0) __extension__ ({ \ 39103 float16x8x2_t __ret; \ 39104 __builtin_neon_vld2q_dup_v(&__ret, __p0, 40); \ 39105 \ 39106 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39107 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39108 __ret; \ 39109 }) 39110 #endif 39111 39112 #ifdef __LITTLE_ENDIAN__ 39113 #define vld2_dup_f16(__p0) __extension__ ({ \ 39114 float16x4x2_t __ret; \ 39115 __builtin_neon_vld2_dup_v(&__ret, __p0, 8); \ 39116 __ret; \ 39117 }) 39118 #else 39119 #define vld2_dup_f16(__p0) __extension__ ({ \ 39120 float16x4x2_t __ret; \ 39121 __builtin_neon_vld2_dup_v(&__ret, __p0, 8); \ 39122 \ 39123 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39124 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 
39125 __ret; \ 39126 }) 39127 #endif 39128 39129 #ifdef __LITTLE_ENDIAN__ 39130 #define vld2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39131 float16x8x2_t __ret; \ 39132 float16x8x2_t __s1 = __p1; \ 39133 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 40); \ 39134 __ret; \ 39135 }) 39136 #else 39137 #define vld2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39138 float16x8x2_t __ret; \ 39139 float16x8x2_t __s1 = __p1; \ 39140 float16x8x2_t __rev1; \ 39141 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39142 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39143 __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 40); \ 39144 \ 39145 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39146 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39147 __ret; \ 39148 }) 39149 #endif 39150 39151 #ifdef __LITTLE_ENDIAN__ 39152 #define vld2_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39153 float16x4x2_t __ret; \ 39154 float16x4x2_t __s1 = __p1; \ 39155 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 8); \ 39156 __ret; \ 39157 }) 39158 #else 39159 #define vld2_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39160 float16x4x2_t __ret; \ 39161 float16x4x2_t __s1 = __p1; \ 39162 float16x4x2_t __rev1; \ 39163 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39164 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39165 __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 8); \ 39166 \ 39167 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39168 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 
39169 __ret; \ 39170 }) 39171 #endif 39172 39173 #ifdef __LITTLE_ENDIAN__ 39174 #define vld3q_f16(__p0) __extension__ ({ \ 39175 float16x8x3_t __ret; \ 39176 __builtin_neon_vld3q_v(&__ret, __p0, 40); \ 39177 __ret; \ 39178 }) 39179 #else 39180 #define vld3q_f16(__p0) __extension__ ({ \ 39181 float16x8x3_t __ret; \ 39182 __builtin_neon_vld3q_v(&__ret, __p0, 40); \ 39183 \ 39184 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39185 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39186 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39187 __ret; \ 39188 }) 39189 #endif 39190 39191 #ifdef __LITTLE_ENDIAN__ 39192 #define vld3_f16(__p0) __extension__ ({ \ 39193 float16x4x3_t __ret; \ 39194 __builtin_neon_vld3_v(&__ret, __p0, 8); \ 39195 __ret; \ 39196 }) 39197 #else 39198 #define vld3_f16(__p0) __extension__ ({ \ 39199 float16x4x3_t __ret; \ 39200 __builtin_neon_vld3_v(&__ret, __p0, 8); \ 39201 \ 39202 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39203 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39204 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 39205 __ret; \ 39206 }) 39207 #endif 39208 39209 #ifdef __LITTLE_ENDIAN__ 39210 #define vld3q_dup_f16(__p0) __extension__ ({ \ 39211 float16x8x3_t __ret; \ 39212 __builtin_neon_vld3q_dup_v(&__ret, __p0, 40); \ 39213 __ret; \ 39214 }) 39215 #else 39216 #define vld3q_dup_f16(__p0) __extension__ ({ \ 39217 float16x8x3_t __ret; \ 39218 __builtin_neon_vld3q_dup_v(&__ret, __p0, 40); \ 39219 \ 39220 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39221 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39222 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 
39223 __ret; \ 39224 }) 39225 #endif 39226 39227 #ifdef __LITTLE_ENDIAN__ 39228 #define vld3_dup_f16(__p0) __extension__ ({ \ 39229 float16x4x3_t __ret; \ 39230 __builtin_neon_vld3_dup_v(&__ret, __p0, 8); \ 39231 __ret; \ 39232 }) 39233 #else 39234 #define vld3_dup_f16(__p0) __extension__ ({ \ 39235 float16x4x3_t __ret; \ 39236 __builtin_neon_vld3_dup_v(&__ret, __p0, 8); \ 39237 \ 39238 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39239 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39240 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 39241 __ret; \ 39242 }) 39243 #endif 39244 39245 #ifdef __LITTLE_ENDIAN__ 39246 #define vld3q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39247 float16x8x3_t __ret; \ 39248 float16x8x3_t __s1 = __p1; \ 39249 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 40); \ 39250 __ret; \ 39251 }) 39252 #else 39253 #define vld3q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39254 float16x8x3_t __ret; \ 39255 float16x8x3_t __s1 = __p1; \ 39256 float16x8x3_t __rev1; \ 39257 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39258 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39259 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39260 __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 40); \ 39261 \ 39262 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39263 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39264 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39265 __ret; \ 39266 }) 39267 #endif 39268 39269 #ifdef __LITTLE_ENDIAN__ 
39270 #define vld3_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39271 float16x4x3_t __ret; \ 39272 float16x4x3_t __s1 = __p1; \ 39273 __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 8); \ 39274 __ret; \ 39275 }) 39276 #else 39277 #define vld3_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39278 float16x4x3_t __ret; \ 39279 float16x4x3_t __s1 = __p1; \ 39280 float16x4x3_t __rev1; \ 39281 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39282 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39283 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 39284 __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 8); \ 39285 \ 39286 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39287 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39288 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 39289 __ret; \ 39290 }) 39291 #endif 39292 39293 #ifdef __LITTLE_ENDIAN__ 39294 #define vld4q_f16(__p0) __extension__ ({ \ 39295 float16x8x4_t __ret; \ 39296 __builtin_neon_vld4q_v(&__ret, __p0, 40); \ 39297 __ret; \ 39298 }) 39299 #else 39300 #define vld4q_f16(__p0) __extension__ ({ \ 39301 float16x8x4_t __ret; \ 39302 __builtin_neon_vld4q_v(&__ret, __p0, 40); \ 39303 \ 39304 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39305 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39306 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39307 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 39308 __ret; \ 39309 }) 39310 #endif 39311 39312 #ifdef __LITTLE_ENDIAN__ 39313 #define vld4_f16(__p0) 
__extension__ ({ \ 39314 float16x4x4_t __ret; \ 39315 __builtin_neon_vld4_v(&__ret, __p0, 8); \ 39316 __ret; \ 39317 }) 39318 #else 39319 #define vld4_f16(__p0) __extension__ ({ \ 39320 float16x4x4_t __ret; \ 39321 __builtin_neon_vld4_v(&__ret, __p0, 8); \ 39322 \ 39323 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39324 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39325 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 39326 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 39327 __ret; \ 39328 }) 39329 #endif 39330 39331 #ifdef __LITTLE_ENDIAN__ 39332 #define vld4q_dup_f16(__p0) __extension__ ({ \ 39333 float16x8x4_t __ret; \ 39334 __builtin_neon_vld4q_dup_v(&__ret, __p0, 40); \ 39335 __ret; \ 39336 }) 39337 #else 39338 #define vld4q_dup_f16(__p0) __extension__ ({ \ 39339 float16x8x4_t __ret; \ 39340 __builtin_neon_vld4q_dup_v(&__ret, __p0, 40); \ 39341 \ 39342 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39343 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39344 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39345 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 39346 __ret; \ 39347 }) 39348 #endif 39349 39350 #ifdef __LITTLE_ENDIAN__ 39351 #define vld4_dup_f16(__p0) __extension__ ({ \ 39352 float16x4x4_t __ret; \ 39353 __builtin_neon_vld4_dup_v(&__ret, __p0, 8); \ 39354 __ret; \ 39355 }) 39356 #else 39357 #define vld4_dup_f16(__p0) __extension__ ({ \ 39358 float16x4x4_t __ret; \ 39359 __builtin_neon_vld4_dup_v(&__ret, __p0, 8); \ 39360 \ 39361 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39362 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39363 __ret.val[2] = 
__builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 39364 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 39365 __ret; \ 39366 }) 39367 #endif 39368 39369 #ifdef __LITTLE_ENDIAN__ 39370 #define vld4q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39371 float16x8x4_t __ret; \ 39372 float16x8x4_t __s1 = __p1; \ 39373 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 40); \ 39374 __ret; \ 39375 }) 39376 #else 39377 #define vld4q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39378 float16x8x4_t __ret; \ 39379 float16x8x4_t __s1 = __p1; \ 39380 float16x8x4_t __rev1; \ 39381 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39382 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39383 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39384 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 39385 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 40); \ 39386 \ 39387 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39388 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39389 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39390 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 39391 __ret; \ 39392 }) 39393 #endif 39394 39395 #ifdef __LITTLE_ENDIAN__ 39396 #define vld4_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39397 float16x4x4_t __ret; \ 39398 float16x4x4_t __s1 = __p1; \ 39399 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 
(int8x8_t)__s1.val[3], __p2, 8); \ 39400 __ret; \ 39401 }) 39402 #else 39403 #define vld4_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39404 float16x4x4_t __ret; \ 39405 float16x4x4_t __s1 = __p1; \ 39406 float16x4x4_t __rev1; \ 39407 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39408 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39409 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 39410 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 39411 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 8); \ 39412 \ 39413 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 3, 2, 1, 0); \ 39414 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 3, 2, 1, 0); \ 39415 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 3, 2, 1, 0); \ 39416 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 3, 2, 1, 0); \ 39417 __ret; \ 39418 }) 39419 #endif 39420 39421 #ifdef __LITTLE_ENDIAN__ 39422 #define vst1q_f16(__p0, __p1) __extension__ ({ \ 39423 float16x8_t __s1 = __p1; \ 39424 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 40); \ 39425 }) 39426 #else 39427 #define vst1q_f16(__p0, __p1) __extension__ ({ \ 39428 float16x8_t __s1 = __p1; \ 39429 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 39430 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 40); \ 39431 }) 39432 #endif 39433 39434 #ifdef __LITTLE_ENDIAN__ 39435 #define vst1_f16(__p0, __p1) __extension__ ({ \ 39436 float16x4_t __s1 = __p1; \ 39437 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 8); \ 39438 }) 39439 #else 39440 #define vst1_f16(__p0, __p1) __extension__ ({ \ 39441 float16x4_t __s1 = __p1; \ 39442 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 39443 
__builtin_neon_vst1_v(__p0, (int8x8_t)__rev1, 8); \ 39444 }) 39445 #endif 39446 39447 #ifdef __LITTLE_ENDIAN__ 39448 #define vst1q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39449 float16x8_t __s1 = __p1; \ 39450 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 40); \ 39451 }) 39452 #else 39453 #define vst1q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39454 float16x8_t __s1 = __p1; \ 39455 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 39456 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 40); \ 39457 }) 39458 #endif 39459 39460 #ifdef __LITTLE_ENDIAN__ 39461 #define vst1_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39462 float16x4_t __s1 = __p1; \ 39463 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 8); \ 39464 }) 39465 #else 39466 #define vst1_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39467 float16x4_t __s1 = __p1; \ 39468 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 39469 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__rev1, __p2, 8); \ 39470 }) 39471 #endif 39472 39473 #ifdef __LITTLE_ENDIAN__ 39474 #define vst1q_f16_x2(__p0, __p1) __extension__ ({ \ 39475 float16x8x2_t __s1 = __p1; \ 39476 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 40); \ 39477 }) 39478 #else 39479 #define vst1q_f16_x2(__p0, __p1) __extension__ ({ \ 39480 float16x8x2_t __s1 = __p1; \ 39481 float16x8x2_t __rev1; \ 39482 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39483 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39484 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 40); \ 39485 }) 39486 #endif 39487 39488 #ifdef __LITTLE_ENDIAN__ 39489 #define vst1_f16_x2(__p0, __p1) __extension__ ({ \ 39490 float16x4x2_t __s1 = __p1; \ 39491 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 8); \ 39492 
}) 39493 #else 39494 #define vst1_f16_x2(__p0, __p1) __extension__ ({ \ 39495 float16x4x2_t __s1 = __p1; \ 39496 float16x4x2_t __rev1; \ 39497 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39498 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39499 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 8); \ 39500 }) 39501 #endif 39502 39503 #ifdef __LITTLE_ENDIAN__ 39504 #define vst1q_f16_x3(__p0, __p1) __extension__ ({ \ 39505 float16x8x3_t __s1 = __p1; \ 39506 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 40); \ 39507 }) 39508 #else 39509 #define vst1q_f16_x3(__p0, __p1) __extension__ ({ \ 39510 float16x8x3_t __s1 = __p1; \ 39511 float16x8x3_t __rev1; \ 39512 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39513 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39514 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39515 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 40); \ 39516 }) 39517 #endif 39518 39519 #ifdef __LITTLE_ENDIAN__ 39520 #define vst1_f16_x3(__p0, __p1) __extension__ ({ \ 39521 float16x4x3_t __s1 = __p1; \ 39522 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 8); \ 39523 }) 39524 #else 39525 #define vst1_f16_x3(__p0, __p1) __extension__ ({ \ 39526 float16x4x3_t __s1 = __p1; \ 39527 float16x4x3_t __rev1; \ 39528 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39529 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39530 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 39531 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 
(int8x8_t)__rev1.val[2], 8); \ 39532 }) 39533 #endif 39534 39535 #ifdef __LITTLE_ENDIAN__ 39536 #define vst1q_f16_x4(__p0, __p1) __extension__ ({ \ 39537 float16x8x4_t __s1 = __p1; \ 39538 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 40); \ 39539 }) 39540 #else 39541 #define vst1q_f16_x4(__p0, __p1) __extension__ ({ \ 39542 float16x8x4_t __s1 = __p1; \ 39543 float16x8x4_t __rev1; \ 39544 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39545 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39546 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39547 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 39548 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 40); \ 39549 }) 39550 #endif 39551 39552 #ifdef __LITTLE_ENDIAN__ 39553 #define vst1_f16_x4(__p0, __p1) __extension__ ({ \ 39554 float16x4x4_t __s1 = __p1; \ 39555 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 8); \ 39556 }) 39557 #else 39558 #define vst1_f16_x4(__p0, __p1) __extension__ ({ \ 39559 float16x4x4_t __s1 = __p1; \ 39560 float16x4x4_t __rev1; \ 39561 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39562 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39563 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 39564 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 39565 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 8); \ 39566 }) 39567 #endif 39568 39569 #ifdef __LITTLE_ENDIAN__ 39570 
#define vst2q_f16(__p0, __p1) __extension__ ({ \ 39571 float16x8x2_t __s1 = __p1; \ 39572 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 40); \ 39573 }) 39574 #else 39575 #define vst2q_f16(__p0, __p1) __extension__ ({ \ 39576 float16x8x2_t __s1 = __p1; \ 39577 float16x8x2_t __rev1; \ 39578 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39579 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39580 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 40); \ 39581 }) 39582 #endif 39583 39584 #ifdef __LITTLE_ENDIAN__ 39585 #define vst2_f16(__p0, __p1) __extension__ ({ \ 39586 float16x4x2_t __s1 = __p1; \ 39587 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 8); \ 39588 }) 39589 #else 39590 #define vst2_f16(__p0, __p1) __extension__ ({ \ 39591 float16x4x2_t __s1 = __p1; \ 39592 float16x4x2_t __rev1; \ 39593 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39594 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39595 __builtin_neon_vst2_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], 8); \ 39596 }) 39597 #endif 39598 39599 #ifdef __LITTLE_ENDIAN__ 39600 #define vst2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39601 float16x8x2_t __s1 = __p1; \ 39602 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 40); \ 39603 }) 39604 #else 39605 #define vst2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39606 float16x8x2_t __s1 = __p1; \ 39607 float16x8x2_t __rev1; \ 39608 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39609 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39610 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 40); \ 39611 }) 39612 #endif 39613 39614 
#ifdef __LITTLE_ENDIAN__ 39615 #define vst2_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39616 float16x4x2_t __s1 = __p1; \ 39617 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 8); \ 39618 }) 39619 #else 39620 #define vst2_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39621 float16x4x2_t __s1 = __p1; \ 39622 float16x4x2_t __rev1; \ 39623 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39624 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39625 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], __p2, 8); \ 39626 }) 39627 #endif 39628 39629 #ifdef __LITTLE_ENDIAN__ 39630 #define vst3q_f16(__p0, __p1) __extension__ ({ \ 39631 float16x8x3_t __s1 = __p1; \ 39632 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 40); \ 39633 }) 39634 #else 39635 #define vst3q_f16(__p0, __p1) __extension__ ({ \ 39636 float16x8x3_t __s1 = __p1; \ 39637 float16x8x3_t __rev1; \ 39638 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39639 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39640 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39641 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 40); \ 39642 }) 39643 #endif 39644 39645 #ifdef __LITTLE_ENDIAN__ 39646 #define vst3_f16(__p0, __p1) __extension__ ({ \ 39647 float16x4x3_t __s1 = __p1; \ 39648 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 8); \ 39649 }) 39650 #else 39651 #define vst3_f16(__p0, __p1) __extension__ ({ \ 39652 float16x4x3_t __s1 = __p1; \ 39653 float16x4x3_t __rev1; \ 39654 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39655 __rev1.val[1] = 
__builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39656 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 39657 __builtin_neon_vst3_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], 8); \ 39658 }) 39659 #endif 39660 39661 #ifdef __LITTLE_ENDIAN__ 39662 #define vst3q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39663 float16x8x3_t __s1 = __p1; \ 39664 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 40); \ 39665 }) 39666 #else 39667 #define vst3q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39668 float16x8x3_t __s1 = __p1; \ 39669 float16x8x3_t __rev1; \ 39670 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39671 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39672 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39673 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 40); \ 39674 }) 39675 #endif 39676 39677 #ifdef __LITTLE_ENDIAN__ 39678 #define vst3_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39679 float16x4x3_t __s1 = __p1; \ 39680 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 8); \ 39681 }) 39682 #else 39683 #define vst3_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39684 float16x4x3_t __s1 = __p1; \ 39685 float16x4x3_t __rev1; \ 39686 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39687 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39688 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 39689 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], __p2, 8); \ 39690 }) 39691 #endif 39692 39693 #ifdef 
__LITTLE_ENDIAN__ 39694 #define vst4q_f16(__p0, __p1) __extension__ ({ \ 39695 float16x8x4_t __s1 = __p1; \ 39696 __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 40); \ 39697 }) 39698 #else 39699 #define vst4q_f16(__p0, __p1) __extension__ ({ \ 39700 float16x8x4_t __s1 = __p1; \ 39701 float16x8x4_t __rev1; \ 39702 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39703 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39704 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39705 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 39706 __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 40); \ 39707 }) 39708 #endif 39709 39710 #ifdef __LITTLE_ENDIAN__ 39711 #define vst4_f16(__p0, __p1) __extension__ ({ \ 39712 float16x4x4_t __s1 = __p1; \ 39713 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 8); \ 39714 }) 39715 #else 39716 #define vst4_f16(__p0, __p1) __extension__ ({ \ 39717 float16x4x4_t __s1 = __p1; \ 39718 float16x4x4_t __rev1; \ 39719 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39720 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39721 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 39722 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 39723 __builtin_neon_vst4_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], 8); \ 39724 }) 39725 #endif 39726 39727 #ifdef __LITTLE_ENDIAN__ 39728 #define vst4q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39729 float16x8x4_t __s1 = __p1; \ 
39730 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 40); \ 39731 }) 39732 #else 39733 #define vst4q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39734 float16x8x4_t __s1 = __p1; \ 39735 float16x8x4_t __rev1; \ 39736 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 39737 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 39738 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 7, 6, 5, 4, 3, 2, 1, 0); \ 39739 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 7, 6, 5, 4, 3, 2, 1, 0); \ 39740 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 40); \ 39741 }) 39742 #endif 39743 39744 #ifdef __LITTLE_ENDIAN__ 39745 #define vst4_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39746 float16x4x4_t __s1 = __p1; \ 39747 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 8); \ 39748 }) 39749 #else 39750 #define vst4_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 39751 float16x4x4_t __s1 = __p1; \ 39752 float16x4x4_t __rev1; \ 39753 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 3, 2, 1, 0); \ 39754 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 3, 2, 1, 0); \ 39755 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 3, 2, 1, 0); \ 39756 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 3, 2, 1, 0); \ 39757 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__rev1.val[0], (int8x8_t)__rev1.val[1], (int8x8_t)__rev1.val[2], (int8x8_t)__rev1.val[3], __p2, 8); \ 39758 }) 39759 #endif 39760 39761 #endif 39762 #if (defined(__aarch64__) || defined(__arm64ec__)) && defined(__ARM_FEATURE_NUMERIC_MAXMIN) 39763 #ifdef __LITTLE_ENDIAN__ 39764 __ai 
__attribute__((target("neon"))) float64x2_t vmaxnmq_f64(float64x2_t __p0, float64x2_t __p1) { 39765 float64x2_t __ret; 39766 __ret = (float64x2_t) __builtin_neon_vmaxnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 39767 return __ret; 39768 } 39769 #else 39770 __ai __attribute__((target("neon"))) float64x2_t vmaxnmq_f64(float64x2_t __p0, float64x2_t __p1) { 39771 float64x2_t __ret; 39772 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39773 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 39774 __ret = (float64x2_t) __builtin_neon_vmaxnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 39775 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39776 return __ret; 39777 } 39778 #endif 39779 39780 __ai __attribute__((target("neon"))) float64x1_t vmaxnm_f64(float64x1_t __p0, float64x1_t __p1) { 39781 float64x1_t __ret; 39782 __ret = (float64x1_t) __builtin_neon_vmaxnm_v((int8x8_t)__p0, (int8x8_t)__p1, 10); 39783 return __ret; 39784 } 39785 #ifdef __LITTLE_ENDIAN__ 39786 __ai __attribute__((target("neon"))) float64x2_t vminnmq_f64(float64x2_t __p0, float64x2_t __p1) { 39787 float64x2_t __ret; 39788 __ret = (float64x2_t) __builtin_neon_vminnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 39789 return __ret; 39790 } 39791 #else 39792 __ai __attribute__((target("neon"))) float64x2_t vminnmq_f64(float64x2_t __p0, float64x2_t __p1) { 39793 float64x2_t __ret; 39794 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39795 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 39796 __ret = (float64x2_t) __builtin_neon_vminnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 39797 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39798 return __ret; 39799 } 39800 #endif 39801 39802 __ai __attribute__((target("neon"))) float64x1_t vminnm_f64(float64x1_t __p0, float64x1_t __p1) { 39803 float64x1_t __ret; 39804 __ret = (float64x1_t) __builtin_neon_vminnm_v((int8x8_t)__p0, (int8x8_t)__p1, 10); 39805 return 
__ret; 39806 } 39807 #endif 39808 #if (defined(__aarch64__) || defined(__arm64ec__)) && defined(__ARM_FEATURE_DIRECTED_ROUNDING) 39809 #ifdef __LITTLE_ENDIAN__ 39810 __ai __attribute__((target("neon"))) float64x2_t vrndq_f64(float64x2_t __p0) { 39811 float64x2_t __ret; 39812 __ret = (float64x2_t) __builtin_neon_vrndq_v((int8x16_t)__p0, 42); 39813 return __ret; 39814 } 39815 #else 39816 __ai __attribute__((target("neon"))) float64x2_t vrndq_f64(float64x2_t __p0) { 39817 float64x2_t __ret; 39818 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39819 __ret = (float64x2_t) __builtin_neon_vrndq_v((int8x16_t)__rev0, 42); 39820 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39821 return __ret; 39822 } 39823 #endif 39824 39825 __ai __attribute__((target("neon"))) float64x1_t vrnd_f64(float64x1_t __p0) { 39826 float64x1_t __ret; 39827 __ret = (float64x1_t) __builtin_neon_vrnd_v((int8x8_t)__p0, 10); 39828 return __ret; 39829 } 39830 #ifdef __LITTLE_ENDIAN__ 39831 __ai __attribute__((target("neon"))) float64x2_t vrndaq_f64(float64x2_t __p0) { 39832 float64x2_t __ret; 39833 __ret = (float64x2_t) __builtin_neon_vrndaq_v((int8x16_t)__p0, 42); 39834 return __ret; 39835 } 39836 #else 39837 __ai __attribute__((target("neon"))) float64x2_t vrndaq_f64(float64x2_t __p0) { 39838 float64x2_t __ret; 39839 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39840 __ret = (float64x2_t) __builtin_neon_vrndaq_v((int8x16_t)__rev0, 42); 39841 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39842 return __ret; 39843 } 39844 #endif 39845 39846 __ai __attribute__((target("neon"))) float64x1_t vrnda_f64(float64x1_t __p0) { 39847 float64x1_t __ret; 39848 __ret = (float64x1_t) __builtin_neon_vrnda_v((int8x8_t)__p0, 10); 39849 return __ret; 39850 } 39851 #ifdef __LITTLE_ENDIAN__ 39852 __ai __attribute__((target("neon"))) float64x2_t vrndiq_f64(float64x2_t __p0) { 39853 float64x2_t __ret; 39854 __ret = (float64x2_t) 
__builtin_neon_vrndiq_v((int8x16_t)__p0, 42); 39855 return __ret; 39856 } 39857 #else 39858 __ai __attribute__((target("neon"))) float64x2_t vrndiq_f64(float64x2_t __p0) { 39859 float64x2_t __ret; 39860 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39861 __ret = (float64x2_t) __builtin_neon_vrndiq_v((int8x16_t)__rev0, 42); 39862 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39863 return __ret; 39864 } 39865 #endif 39866 39867 __ai __attribute__((target("neon"))) float64x1_t vrndi_f64(float64x1_t __p0) { 39868 float64x1_t __ret; 39869 __ret = (float64x1_t) __builtin_neon_vrndi_v((int8x8_t)__p0, 10); 39870 return __ret; 39871 } 39872 #ifdef __LITTLE_ENDIAN__ 39873 __ai __attribute__((target("neon"))) float64x2_t vrndmq_f64(float64x2_t __p0) { 39874 float64x2_t __ret; 39875 __ret = (float64x2_t) __builtin_neon_vrndmq_v((int8x16_t)__p0, 42); 39876 return __ret; 39877 } 39878 #else 39879 __ai __attribute__((target("neon"))) float64x2_t vrndmq_f64(float64x2_t __p0) { 39880 float64x2_t __ret; 39881 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39882 __ret = (float64x2_t) __builtin_neon_vrndmq_v((int8x16_t)__rev0, 42); 39883 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39884 return __ret; 39885 } 39886 #endif 39887 39888 __ai __attribute__((target("neon"))) float64x1_t vrndm_f64(float64x1_t __p0) { 39889 float64x1_t __ret; 39890 __ret = (float64x1_t) __builtin_neon_vrndm_v((int8x8_t)__p0, 10); 39891 return __ret; 39892 } 39893 #ifdef __LITTLE_ENDIAN__ 39894 __ai __attribute__((target("neon"))) float64x2_t vrndnq_f64(float64x2_t __p0) { 39895 float64x2_t __ret; 39896 __ret = (float64x2_t) __builtin_neon_vrndnq_v((int8x16_t)__p0, 42); 39897 return __ret; 39898 } 39899 #else 39900 __ai __attribute__((target("neon"))) float64x2_t vrndnq_f64(float64x2_t __p0) { 39901 float64x2_t __ret; 39902 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39903 __ret = (float64x2_t) 
__builtin_neon_vrndnq_v((int8x16_t)__rev0, 42); 39904 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39905 return __ret; 39906 } 39907 #endif 39908 39909 __ai __attribute__((target("neon"))) float64x1_t vrndn_f64(float64x1_t __p0) { 39910 float64x1_t __ret; 39911 __ret = (float64x1_t) __builtin_neon_vrndn_v((int8x8_t)__p0, 10); 39912 return __ret; 39913 } 39914 #ifdef __LITTLE_ENDIAN__ 39915 __ai __attribute__((target("neon"))) float64x2_t vrndpq_f64(float64x2_t __p0) { 39916 float64x2_t __ret; 39917 __ret = (float64x2_t) __builtin_neon_vrndpq_v((int8x16_t)__p0, 42); 39918 return __ret; 39919 } 39920 #else 39921 __ai __attribute__((target("neon"))) float64x2_t vrndpq_f64(float64x2_t __p0) { 39922 float64x2_t __ret; 39923 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39924 __ret = (float64x2_t) __builtin_neon_vrndpq_v((int8x16_t)__rev0, 42); 39925 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39926 return __ret; 39927 } 39928 #endif 39929 39930 __ai __attribute__((target("neon"))) float64x1_t vrndp_f64(float64x1_t __p0) { 39931 float64x1_t __ret; 39932 __ret = (float64x1_t) __builtin_neon_vrndp_v((int8x8_t)__p0, 10); 39933 return __ret; 39934 } 39935 #ifdef __LITTLE_ENDIAN__ 39936 __ai __attribute__((target("neon"))) float64x2_t vrndxq_f64(float64x2_t __p0) { 39937 float64x2_t __ret; 39938 __ret = (float64x2_t) __builtin_neon_vrndxq_v((int8x16_t)__p0, 42); 39939 return __ret; 39940 } 39941 #else 39942 __ai __attribute__((target("neon"))) float64x2_t vrndxq_f64(float64x2_t __p0) { 39943 float64x2_t __ret; 39944 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 39945 __ret = (float64x2_t) __builtin_neon_vrndxq_v((int8x16_t)__rev0, 42); 39946 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 39947 return __ret; 39948 } 39949 #endif 39950 39951 __ai __attribute__((target("neon"))) float64x1_t vrndx_f64(float64x1_t __p0) { 39952 float64x1_t __ret; 39953 __ret = (float64x1_t) 
__builtin_neon_vrndx_v((int8x8_t)__p0, 10); 39954 return __ret; 39955 } 39956 #endif 39957 #if __ARM_ARCH >= 8 39958 #ifdef __LITTLE_ENDIAN__ 39959 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesdq_u8(uint8x16_t __p0, uint8x16_t __p1) { 39960 uint8x16_t __ret; 39961 __ret = (uint8x16_t) __builtin_neon_vaesdq_u8((int8x16_t)__p0, (int8x16_t)__p1, 48); 39962 return __ret; 39963 } 39964 #else 39965 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesdq_u8(uint8x16_t __p0, uint8x16_t __p1) { 39966 uint8x16_t __ret; 39967 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 39968 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 39969 __ret = (uint8x16_t) __builtin_neon_vaesdq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 39970 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 39971 return __ret; 39972 } 39973 #endif 39974 39975 #ifdef __LITTLE_ENDIAN__ 39976 __ai __attribute__((target("aes,neon"))) uint8x16_t vaeseq_u8(uint8x16_t __p0, uint8x16_t __p1) { 39977 uint8x16_t __ret; 39978 __ret = (uint8x16_t) __builtin_neon_vaeseq_u8((int8x16_t)__p0, (int8x16_t)__p1, 48); 39979 return __ret; 39980 } 39981 #else 39982 __ai __attribute__((target("aes,neon"))) uint8x16_t vaeseq_u8(uint8x16_t __p0, uint8x16_t __p1) { 39983 uint8x16_t __ret; 39984 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 39985 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 39986 __ret = (uint8x16_t) __builtin_neon_vaeseq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 39987 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 39988 return __ret; 39989 } 39990 #endif 39991 39992 #ifdef __LITTLE_ENDIAN__ 39993 __ai 
__attribute__((target("aes,neon"))) uint8x16_t vaesimcq_u8(uint8x16_t __p0) { 39994 uint8x16_t __ret; 39995 __ret = (uint8x16_t) __builtin_neon_vaesimcq_u8((int8x16_t)__p0, 48); 39996 return __ret; 39997 } 39998 #else 39999 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesimcq_u8(uint8x16_t __p0) { 40000 uint8x16_t __ret; 40001 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 40002 __ret = (uint8x16_t) __builtin_neon_vaesimcq_u8((int8x16_t)__rev0, 48); 40003 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 40004 return __ret; 40005 } 40006 #endif 40007 40008 #ifdef __LITTLE_ENDIAN__ 40009 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesmcq_u8(uint8x16_t __p0) { 40010 uint8x16_t __ret; 40011 __ret = (uint8x16_t) __builtin_neon_vaesmcq_u8((int8x16_t)__p0, 48); 40012 return __ret; 40013 } 40014 #else 40015 __ai __attribute__((target("aes,neon"))) uint8x16_t vaesmcq_u8(uint8x16_t __p0) { 40016 uint8x16_t __ret; 40017 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 40018 __ret = (uint8x16_t) __builtin_neon_vaesmcq_u8((int8x16_t)__rev0, 48); 40019 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 40020 return __ret; 40021 } 40022 #endif 40023 40024 #ifdef __LITTLE_ENDIAN__ 40025 __ai __attribute__((target("neon"))) int32x4_t vcvtaq_s32_f32(float32x4_t __p0) { 40026 int32x4_t __ret; 40027 __ret = (int32x4_t) __builtin_neon_vcvtaq_s32_v((int8x16_t)__p0, 34); 40028 return __ret; 40029 } 40030 #else 40031 __ai __attribute__((target("neon"))) int32x4_t vcvtaq_s32_f32(float32x4_t __p0) { 40032 int32x4_t __ret; 40033 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40034 __ret = (int32x4_t) __builtin_neon_vcvtaq_s32_v((int8x16_t)__rev0, 34); 40035 __ret = __builtin_shufflevector(__ret, __ret, 3, 
2, 1, 0); 40036 return __ret; 40037 } 40038 #endif 40039 40040 #ifdef __LITTLE_ENDIAN__ 40041 __ai __attribute__((target("neon"))) int32x2_t vcvta_s32_f32(float32x2_t __p0) { 40042 int32x2_t __ret; 40043 __ret = (int32x2_t) __builtin_neon_vcvta_s32_v((int8x8_t)__p0, 2); 40044 return __ret; 40045 } 40046 #else 40047 __ai __attribute__((target("neon"))) int32x2_t vcvta_s32_f32(float32x2_t __p0) { 40048 int32x2_t __ret; 40049 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40050 __ret = (int32x2_t) __builtin_neon_vcvta_s32_v((int8x8_t)__rev0, 2); 40051 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40052 return __ret; 40053 } 40054 #endif 40055 40056 #ifdef __LITTLE_ENDIAN__ 40057 __ai __attribute__((target("neon"))) uint32x4_t vcvtaq_u32_f32(float32x4_t __p0) { 40058 uint32x4_t __ret; 40059 __ret = (uint32x4_t) __builtin_neon_vcvtaq_u32_v((int8x16_t)__p0, 50); 40060 return __ret; 40061 } 40062 #else 40063 __ai __attribute__((target("neon"))) uint32x4_t vcvtaq_u32_f32(float32x4_t __p0) { 40064 uint32x4_t __ret; 40065 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40066 __ret = (uint32x4_t) __builtin_neon_vcvtaq_u32_v((int8x16_t)__rev0, 50); 40067 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40068 return __ret; 40069 } 40070 #endif 40071 40072 #ifdef __LITTLE_ENDIAN__ 40073 __ai __attribute__((target("neon"))) uint32x2_t vcvta_u32_f32(float32x2_t __p0) { 40074 uint32x2_t __ret; 40075 __ret = (uint32x2_t) __builtin_neon_vcvta_u32_v((int8x8_t)__p0, 18); 40076 return __ret; 40077 } 40078 #else 40079 __ai __attribute__((target("neon"))) uint32x2_t vcvta_u32_f32(float32x2_t __p0) { 40080 uint32x2_t __ret; 40081 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40082 __ret = (uint32x2_t) __builtin_neon_vcvta_u32_v((int8x8_t)__rev0, 18); 40083 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40084 return __ret; 40085 } 40086 #endif 40087 40088 #ifdef __LITTLE_ENDIAN__ 40089 
__ai __attribute__((target("neon"))) int32x4_t vcvtmq_s32_f32(float32x4_t __p0) { 40090 int32x4_t __ret; 40091 __ret = (int32x4_t) __builtin_neon_vcvtmq_s32_v((int8x16_t)__p0, 34); 40092 return __ret; 40093 } 40094 #else 40095 __ai __attribute__((target("neon"))) int32x4_t vcvtmq_s32_f32(float32x4_t __p0) { 40096 int32x4_t __ret; 40097 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40098 __ret = (int32x4_t) __builtin_neon_vcvtmq_s32_v((int8x16_t)__rev0, 34); 40099 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40100 return __ret; 40101 } 40102 #endif 40103 40104 #ifdef __LITTLE_ENDIAN__ 40105 __ai __attribute__((target("neon"))) int32x2_t vcvtm_s32_f32(float32x2_t __p0) { 40106 int32x2_t __ret; 40107 __ret = (int32x2_t) __builtin_neon_vcvtm_s32_v((int8x8_t)__p0, 2); 40108 return __ret; 40109 } 40110 #else 40111 __ai __attribute__((target("neon"))) int32x2_t vcvtm_s32_f32(float32x2_t __p0) { 40112 int32x2_t __ret; 40113 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40114 __ret = (int32x2_t) __builtin_neon_vcvtm_s32_v((int8x8_t)__rev0, 2); 40115 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40116 return __ret; 40117 } 40118 #endif 40119 40120 #ifdef __LITTLE_ENDIAN__ 40121 __ai __attribute__((target("neon"))) uint32x4_t vcvtmq_u32_f32(float32x4_t __p0) { 40122 uint32x4_t __ret; 40123 __ret = (uint32x4_t) __builtin_neon_vcvtmq_u32_v((int8x16_t)__p0, 50); 40124 return __ret; 40125 } 40126 #else 40127 __ai __attribute__((target("neon"))) uint32x4_t vcvtmq_u32_f32(float32x4_t __p0) { 40128 uint32x4_t __ret; 40129 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40130 __ret = (uint32x4_t) __builtin_neon_vcvtmq_u32_v((int8x16_t)__rev0, 50); 40131 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40132 return __ret; 40133 } 40134 #endif 40135 40136 #ifdef __LITTLE_ENDIAN__ 40137 __ai __attribute__((target("neon"))) uint32x2_t vcvtm_u32_f32(float32x2_t __p0) { 
40138 uint32x2_t __ret; 40139 __ret = (uint32x2_t) __builtin_neon_vcvtm_u32_v((int8x8_t)__p0, 18); 40140 return __ret; 40141 } 40142 #else 40143 __ai __attribute__((target("neon"))) uint32x2_t vcvtm_u32_f32(float32x2_t __p0) { 40144 uint32x2_t __ret; 40145 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40146 __ret = (uint32x2_t) __builtin_neon_vcvtm_u32_v((int8x8_t)__rev0, 18); 40147 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40148 return __ret; 40149 } 40150 #endif 40151 40152 #ifdef __LITTLE_ENDIAN__ 40153 __ai __attribute__((target("neon"))) int32x4_t vcvtnq_s32_f32(float32x4_t __p0) { 40154 int32x4_t __ret; 40155 __ret = (int32x4_t) __builtin_neon_vcvtnq_s32_v((int8x16_t)__p0, 34); 40156 return __ret; 40157 } 40158 #else 40159 __ai __attribute__((target("neon"))) int32x4_t vcvtnq_s32_f32(float32x4_t __p0) { 40160 int32x4_t __ret; 40161 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40162 __ret = (int32x4_t) __builtin_neon_vcvtnq_s32_v((int8x16_t)__rev0, 34); 40163 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40164 return __ret; 40165 } 40166 #endif 40167 40168 #ifdef __LITTLE_ENDIAN__ 40169 __ai __attribute__((target("neon"))) int32x2_t vcvtn_s32_f32(float32x2_t __p0) { 40170 int32x2_t __ret; 40171 __ret = (int32x2_t) __builtin_neon_vcvtn_s32_v((int8x8_t)__p0, 2); 40172 return __ret; 40173 } 40174 #else 40175 __ai __attribute__((target("neon"))) int32x2_t vcvtn_s32_f32(float32x2_t __p0) { 40176 int32x2_t __ret; 40177 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40178 __ret = (int32x2_t) __builtin_neon_vcvtn_s32_v((int8x8_t)__rev0, 2); 40179 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40180 return __ret; 40181 } 40182 #endif 40183 40184 #ifdef __LITTLE_ENDIAN__ 40185 __ai __attribute__((target("neon"))) uint32x4_t vcvtnq_u32_f32(float32x4_t __p0) { 40186 uint32x4_t __ret; 40187 __ret = (uint32x4_t) __builtin_neon_vcvtnq_u32_v((int8x16_t)__p0, 50); 
40188 return __ret; 40189 } 40190 #else 40191 __ai __attribute__((target("neon"))) uint32x4_t vcvtnq_u32_f32(float32x4_t __p0) { 40192 uint32x4_t __ret; 40193 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40194 __ret = (uint32x4_t) __builtin_neon_vcvtnq_u32_v((int8x16_t)__rev0, 50); 40195 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40196 return __ret; 40197 } 40198 #endif 40199 40200 #ifdef __LITTLE_ENDIAN__ 40201 __ai __attribute__((target("neon"))) uint32x2_t vcvtn_u32_f32(float32x2_t __p0) { 40202 uint32x2_t __ret; 40203 __ret = (uint32x2_t) __builtin_neon_vcvtn_u32_v((int8x8_t)__p0, 18); 40204 return __ret; 40205 } 40206 #else 40207 __ai __attribute__((target("neon"))) uint32x2_t vcvtn_u32_f32(float32x2_t __p0) { 40208 uint32x2_t __ret; 40209 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40210 __ret = (uint32x2_t) __builtin_neon_vcvtn_u32_v((int8x8_t)__rev0, 18); 40211 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40212 return __ret; 40213 } 40214 #endif 40215 40216 #ifdef __LITTLE_ENDIAN__ 40217 __ai __attribute__((target("neon"))) int32x4_t vcvtpq_s32_f32(float32x4_t __p0) { 40218 int32x4_t __ret; 40219 __ret = (int32x4_t) __builtin_neon_vcvtpq_s32_v((int8x16_t)__p0, 34); 40220 return __ret; 40221 } 40222 #else 40223 __ai __attribute__((target("neon"))) int32x4_t vcvtpq_s32_f32(float32x4_t __p0) { 40224 int32x4_t __ret; 40225 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40226 __ret = (int32x4_t) __builtin_neon_vcvtpq_s32_v((int8x16_t)__rev0, 34); 40227 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40228 return __ret; 40229 } 40230 #endif 40231 40232 #ifdef __LITTLE_ENDIAN__ 40233 __ai __attribute__((target("neon"))) int32x2_t vcvtp_s32_f32(float32x2_t __p0) { 40234 int32x2_t __ret; 40235 __ret = (int32x2_t) __builtin_neon_vcvtp_s32_v((int8x8_t)__p0, 2); 40236 return __ret; 40237 } 40238 #else 40239 __ai __attribute__((target("neon"))) 
int32x2_t vcvtp_s32_f32(float32x2_t __p0) { 40240 int32x2_t __ret; 40241 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40242 __ret = (int32x2_t) __builtin_neon_vcvtp_s32_v((int8x8_t)__rev0, 2); 40243 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40244 return __ret; 40245 } 40246 #endif 40247 40248 #ifdef __LITTLE_ENDIAN__ 40249 __ai __attribute__((target("neon"))) uint32x4_t vcvtpq_u32_f32(float32x4_t __p0) { 40250 uint32x4_t __ret; 40251 __ret = (uint32x4_t) __builtin_neon_vcvtpq_u32_v((int8x16_t)__p0, 50); 40252 return __ret; 40253 } 40254 #else 40255 __ai __attribute__((target("neon"))) uint32x4_t vcvtpq_u32_f32(float32x4_t __p0) { 40256 uint32x4_t __ret; 40257 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40258 __ret = (uint32x4_t) __builtin_neon_vcvtpq_u32_v((int8x16_t)__rev0, 50); 40259 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40260 return __ret; 40261 } 40262 #endif 40263 40264 #ifdef __LITTLE_ENDIAN__ 40265 __ai __attribute__((target("neon"))) uint32x2_t vcvtp_u32_f32(float32x2_t __p0) { 40266 uint32x2_t __ret; 40267 __ret = (uint32x2_t) __builtin_neon_vcvtp_u32_v((int8x8_t)__p0, 18); 40268 return __ret; 40269 } 40270 #else 40271 __ai __attribute__((target("neon"))) uint32x2_t vcvtp_u32_f32(float32x2_t __p0) { 40272 uint32x2_t __ret; 40273 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40274 __ret = (uint32x2_t) __builtin_neon_vcvtp_u32_v((int8x8_t)__rev0, 18); 40275 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40276 return __ret; 40277 } 40278 #endif 40279 40280 #ifdef __LITTLE_ENDIAN__ 40281 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1cq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) { 40282 uint32x4_t __ret; 40283 __ret = (uint32x4_t) __builtin_neon_vsha1cq_u32(__p0, __p1, __p2); 40284 return __ret; 40285 } 40286 #else 40287 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1cq_u32(uint32x4_t __p0, uint32_t __p1, 
uint32x4_t __p2) { 40288 uint32x4_t __ret; 40289 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40290 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 40291 __ret = (uint32x4_t) __builtin_neon_vsha1cq_u32(__rev0, __p1, __rev2); 40292 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40293 return __ret; 40294 } 40295 #endif 40296 40297 __ai __attribute__((target("sha2,neon"))) uint32_t vsha1h_u32(uint32_t __p0) { 40298 uint32_t __ret; 40299 __ret = (uint32_t) __builtin_neon_vsha1h_u32(__p0); 40300 return __ret; 40301 } 40302 #ifdef __LITTLE_ENDIAN__ 40303 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1mq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) { 40304 uint32x4_t __ret; 40305 __ret = (uint32x4_t) __builtin_neon_vsha1mq_u32(__p0, __p1, __p2); 40306 return __ret; 40307 } 40308 #else 40309 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1mq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) { 40310 uint32x4_t __ret; 40311 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40312 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 40313 __ret = (uint32x4_t) __builtin_neon_vsha1mq_u32(__rev0, __p1, __rev2); 40314 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40315 return __ret; 40316 } 40317 #endif 40318 40319 #ifdef __LITTLE_ENDIAN__ 40320 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1pq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) { 40321 uint32x4_t __ret; 40322 __ret = (uint32x4_t) __builtin_neon_vsha1pq_u32(__p0, __p1, __p2); 40323 return __ret; 40324 } 40325 #else 40326 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1pq_u32(uint32x4_t __p0, uint32_t __p1, uint32x4_t __p2) { 40327 uint32x4_t __ret; 40328 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40329 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 40330 __ret = 
(uint32x4_t) __builtin_neon_vsha1pq_u32(__rev0, __p1, __rev2); 40331 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40332 return __ret; 40333 } 40334 #endif 40335 40336 #ifdef __LITTLE_ENDIAN__ 40337 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1su0q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 40338 uint32x4_t __ret; 40339 __ret = (uint32x4_t) __builtin_neon_vsha1su0q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 40340 return __ret; 40341 } 40342 #else 40343 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1su0q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 40344 uint32x4_t __ret; 40345 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40346 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40347 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 40348 __ret = (uint32x4_t) __builtin_neon_vsha1su0q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 40349 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40350 return __ret; 40351 } 40352 #endif 40353 40354 #ifdef __LITTLE_ENDIAN__ 40355 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1su1q_u32(uint32x4_t __p0, uint32x4_t __p1) { 40356 uint32x4_t __ret; 40357 __ret = (uint32x4_t) __builtin_neon_vsha1su1q_u32((int8x16_t)__p0, (int8x16_t)__p1, 50); 40358 return __ret; 40359 } 40360 #else 40361 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha1su1q_u32(uint32x4_t __p0, uint32x4_t __p1) { 40362 uint32x4_t __ret; 40363 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40364 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40365 __ret = (uint32x4_t) __builtin_neon_vsha1su1q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 40366 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40367 return __ret; 40368 } 40369 #endif 40370 40371 #ifdef __LITTLE_ENDIAN__ 40372 __ai 
__attribute__((target("sha2,neon"))) uint32x4_t vsha256hq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 40373 uint32x4_t __ret; 40374 __ret = (uint32x4_t) __builtin_neon_vsha256hq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 40375 return __ret; 40376 } 40377 #else 40378 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256hq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 40379 uint32x4_t __ret; 40380 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40381 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40382 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 40383 __ret = (uint32x4_t) __builtin_neon_vsha256hq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 40384 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40385 return __ret; 40386 } 40387 #endif 40388 40389 #ifdef __LITTLE_ENDIAN__ 40390 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256h2q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 40391 uint32x4_t __ret; 40392 __ret = (uint32x4_t) __builtin_neon_vsha256h2q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 40393 return __ret; 40394 } 40395 #else 40396 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256h2q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 40397 uint32x4_t __ret; 40398 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40399 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40400 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 40401 __ret = (uint32x4_t) __builtin_neon_vsha256h2q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 40402 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40403 return __ret; 40404 } 40405 #endif 40406 40407 #ifdef __LITTLE_ENDIAN__ 40408 __ai __attribute__((target("sha2,neon"))) uint32x4_t 
vsha256su0q_u32(uint32x4_t __p0, uint32x4_t __p1) { 40409 uint32x4_t __ret; 40410 __ret = (uint32x4_t) __builtin_neon_vsha256su0q_u32((int8x16_t)__p0, (int8x16_t)__p1, 50); 40411 return __ret; 40412 } 40413 #else 40414 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256su0q_u32(uint32x4_t __p0, uint32x4_t __p1) { 40415 uint32x4_t __ret; 40416 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40417 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40418 __ret = (uint32x4_t) __builtin_neon_vsha256su0q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 40419 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40420 return __ret; 40421 } 40422 #endif 40423 40424 #ifdef __LITTLE_ENDIAN__ 40425 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256su1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 40426 uint32x4_t __ret; 40427 __ret = (uint32x4_t) __builtin_neon_vsha256su1q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 40428 return __ret; 40429 } 40430 #else 40431 __ai __attribute__((target("sha2,neon"))) uint32x4_t vsha256su1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 40432 uint32x4_t __ret; 40433 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40434 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40435 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 40436 __ret = (uint32x4_t) __builtin_neon_vsha256su1q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 40437 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40438 return __ret; 40439 } 40440 #endif 40441 40442 #endif 40443 #if __ARM_ARCH >= 8 && defined(__ARM_FEATURE_DIRECTED_ROUNDING) 40444 #ifdef __LITTLE_ENDIAN__ 40445 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndq_f16(float16x8_t __p0) { 40446 float16x8_t __ret; 40447 __ret = (float16x8_t) __builtin_neon_vrndq_f16((int8x16_t)__p0, 
40); 40448 return __ret; 40449 } 40450 #else 40451 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndq_f16(float16x8_t __p0) { 40452 float16x8_t __ret; 40453 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 40454 __ret = (float16x8_t) __builtin_neon_vrndq_f16((int8x16_t)__rev0, 40); 40455 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 40456 return __ret; 40457 } 40458 #endif 40459 40460 #ifdef __LITTLE_ENDIAN__ 40461 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrnd_f16(float16x4_t __p0) { 40462 float16x4_t __ret; 40463 __ret = (float16x4_t) __builtin_neon_vrnd_f16((int8x8_t)__p0, 8); 40464 return __ret; 40465 } 40466 #else 40467 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrnd_f16(float16x4_t __p0) { 40468 float16x4_t __ret; 40469 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40470 __ret = (float16x4_t) __builtin_neon_vrnd_f16((int8x8_t)__rev0, 8); 40471 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40472 return __ret; 40473 } 40474 #endif 40475 40476 #ifdef __LITTLE_ENDIAN__ 40477 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndaq_f16(float16x8_t __p0) { 40478 float16x8_t __ret; 40479 __ret = (float16x8_t) __builtin_neon_vrndaq_f16((int8x16_t)__p0, 40); 40480 return __ret; 40481 } 40482 #else 40483 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndaq_f16(float16x8_t __p0) { 40484 float16x8_t __ret; 40485 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 40486 __ret = (float16x8_t) __builtin_neon_vrndaq_f16((int8x16_t)__rev0, 40); 40487 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 40488 return __ret; 40489 } 40490 #endif 40491 40492 #ifdef __LITTLE_ENDIAN__ 40493 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrnda_f16(float16x4_t __p0) { 40494 float16x4_t __ret; 40495 __ret = (float16x4_t) 
__builtin_neon_vrnda_f16((int8x8_t)__p0, 8); 40496 return __ret; 40497 } 40498 #else 40499 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrnda_f16(float16x4_t __p0) { 40500 float16x4_t __ret; 40501 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40502 __ret = (float16x4_t) __builtin_neon_vrnda_f16((int8x8_t)__rev0, 8); 40503 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40504 return __ret; 40505 } 40506 #endif 40507 40508 #ifdef __LITTLE_ENDIAN__ 40509 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndmq_f16(float16x8_t __p0) { 40510 float16x8_t __ret; 40511 __ret = (float16x8_t) __builtin_neon_vrndmq_f16((int8x16_t)__p0, 40); 40512 return __ret; 40513 } 40514 #else 40515 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndmq_f16(float16x8_t __p0) { 40516 float16x8_t __ret; 40517 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 40518 __ret = (float16x8_t) __builtin_neon_vrndmq_f16((int8x16_t)__rev0, 40); 40519 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 40520 return __ret; 40521 } 40522 #endif 40523 40524 #ifdef __LITTLE_ENDIAN__ 40525 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndm_f16(float16x4_t __p0) { 40526 float16x4_t __ret; 40527 __ret = (float16x4_t) __builtin_neon_vrndm_f16((int8x8_t)__p0, 8); 40528 return __ret; 40529 } 40530 #else 40531 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndm_f16(float16x4_t __p0) { 40532 float16x4_t __ret; 40533 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40534 __ret = (float16x4_t) __builtin_neon_vrndm_f16((int8x8_t)__rev0, 8); 40535 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40536 return __ret; 40537 } 40538 #endif 40539 40540 #ifdef __LITTLE_ENDIAN__ 40541 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndnq_f16(float16x8_t __p0) { 40542 float16x8_t __ret; 40543 __ret = (float16x8_t) 
__builtin_neon_vrndnq_f16((int8x16_t)__p0, 40); 40544 return __ret; 40545 } 40546 #else 40547 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndnq_f16(float16x8_t __p0) { 40548 float16x8_t __ret; 40549 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 40550 __ret = (float16x8_t) __builtin_neon_vrndnq_f16((int8x16_t)__rev0, 40); 40551 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 40552 return __ret; 40553 } 40554 #endif 40555 40556 #ifdef __LITTLE_ENDIAN__ 40557 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndn_f16(float16x4_t __p0) { 40558 float16x4_t __ret; 40559 __ret = (float16x4_t) __builtin_neon_vrndn_f16((int8x8_t)__p0, 8); 40560 return __ret; 40561 } 40562 #else 40563 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndn_f16(float16x4_t __p0) { 40564 float16x4_t __ret; 40565 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40566 __ret = (float16x4_t) __builtin_neon_vrndn_f16((int8x8_t)__rev0, 8); 40567 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40568 return __ret; 40569 } 40570 #endif 40571 40572 #ifdef __LITTLE_ENDIAN__ 40573 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndpq_f16(float16x8_t __p0) { 40574 float16x8_t __ret; 40575 __ret = (float16x8_t) __builtin_neon_vrndpq_f16((int8x16_t)__p0, 40); 40576 return __ret; 40577 } 40578 #else 40579 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndpq_f16(float16x8_t __p0) { 40580 float16x8_t __ret; 40581 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 40582 __ret = (float16x8_t) __builtin_neon_vrndpq_f16((int8x16_t)__rev0, 40); 40583 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 40584 return __ret; 40585 } 40586 #endif 40587 40588 #ifdef __LITTLE_ENDIAN__ 40589 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndp_f16(float16x4_t __p0) { 40590 float16x4_t __ret; 40591 
__ret = (float16x4_t) __builtin_neon_vrndp_f16((int8x8_t)__p0, 8); 40592 return __ret; 40593 } 40594 #else 40595 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndp_f16(float16x4_t __p0) { 40596 float16x4_t __ret; 40597 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40598 __ret = (float16x4_t) __builtin_neon_vrndp_f16((int8x8_t)__rev0, 8); 40599 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40600 return __ret; 40601 } 40602 #endif 40603 40604 #ifdef __LITTLE_ENDIAN__ 40605 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndxq_f16(float16x8_t __p0) { 40606 float16x8_t __ret; 40607 __ret = (float16x8_t) __builtin_neon_vrndxq_f16((int8x16_t)__p0, 40); 40608 return __ret; 40609 } 40610 #else 40611 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndxq_f16(float16x8_t __p0) { 40612 float16x8_t __ret; 40613 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 40614 __ret = (float16x8_t) __builtin_neon_vrndxq_f16((int8x16_t)__rev0, 40); 40615 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 40616 return __ret; 40617 } 40618 #endif 40619 40620 #ifdef __LITTLE_ENDIAN__ 40621 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndx_f16(float16x4_t __p0) { 40622 float16x4_t __ret; 40623 __ret = (float16x4_t) __builtin_neon_vrndx_f16((int8x8_t)__p0, 8); 40624 return __ret; 40625 } 40626 #else 40627 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndx_f16(float16x4_t __p0) { 40628 float16x4_t __ret; 40629 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40630 __ret = (float16x4_t) __builtin_neon_vrndx_f16((int8x8_t)__rev0, 8); 40631 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40632 return __ret; 40633 } 40634 #endif 40635 40636 #ifdef __LITTLE_ENDIAN__ 40637 __ai __attribute__((target("neon"))) float32x4_t vrndq_f32(float32x4_t __p0) { 40638 float32x4_t __ret; 40639 __ret = 
(float32x4_t) __builtin_neon_vrndq_v((int8x16_t)__p0, 41); 40640 return __ret; 40641 } 40642 #else 40643 __ai __attribute__((target("neon"))) float32x4_t vrndq_f32(float32x4_t __p0) { 40644 float32x4_t __ret; 40645 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40646 __ret = (float32x4_t) __builtin_neon_vrndq_v((int8x16_t)__rev0, 41); 40647 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40648 return __ret; 40649 } 40650 #endif 40651 40652 #ifdef __LITTLE_ENDIAN__ 40653 __ai __attribute__((target("neon"))) float32x2_t vrnd_f32(float32x2_t __p0) { 40654 float32x2_t __ret; 40655 __ret = (float32x2_t) __builtin_neon_vrnd_v((int8x8_t)__p0, 9); 40656 return __ret; 40657 } 40658 #else 40659 __ai __attribute__((target("neon"))) float32x2_t vrnd_f32(float32x2_t __p0) { 40660 float32x2_t __ret; 40661 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40662 __ret = (float32x2_t) __builtin_neon_vrnd_v((int8x8_t)__rev0, 9); 40663 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40664 return __ret; 40665 } 40666 #endif 40667 40668 #ifdef __LITTLE_ENDIAN__ 40669 __ai __attribute__((target("neon"))) float32x4_t vrndaq_f32(float32x4_t __p0) { 40670 float32x4_t __ret; 40671 __ret = (float32x4_t) __builtin_neon_vrndaq_v((int8x16_t)__p0, 41); 40672 return __ret; 40673 } 40674 #else 40675 __ai __attribute__((target("neon"))) float32x4_t vrndaq_f32(float32x4_t __p0) { 40676 float32x4_t __ret; 40677 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40678 __ret = (float32x4_t) __builtin_neon_vrndaq_v((int8x16_t)__rev0, 41); 40679 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40680 return __ret; 40681 } 40682 #endif 40683 40684 #ifdef __LITTLE_ENDIAN__ 40685 __ai __attribute__((target("neon"))) float32x2_t vrnda_f32(float32x2_t __p0) { 40686 float32x2_t __ret; 40687 __ret = (float32x2_t) __builtin_neon_vrnda_v((int8x8_t)__p0, 9); 40688 return __ret; 40689 } 40690 #else 40691 __ai 
__attribute__((target("neon"))) float32x2_t vrnda_f32(float32x2_t __p0) { 40692 float32x2_t __ret; 40693 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40694 __ret = (float32x2_t) __builtin_neon_vrnda_v((int8x8_t)__rev0, 9); 40695 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40696 return __ret; 40697 } 40698 #endif 40699 40700 #ifdef __LITTLE_ENDIAN__ 40701 __ai __attribute__((target("neon"))) float32x4_t vrndiq_f32(float32x4_t __p0) { 40702 float32x4_t __ret; 40703 __ret = (float32x4_t) __builtin_neon_vrndiq_v((int8x16_t)__p0, 41); 40704 return __ret; 40705 } 40706 #else 40707 __ai __attribute__((target("neon"))) float32x4_t vrndiq_f32(float32x4_t __p0) { 40708 float32x4_t __ret; 40709 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40710 __ret = (float32x4_t) __builtin_neon_vrndiq_v((int8x16_t)__rev0, 41); 40711 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40712 return __ret; 40713 } 40714 #endif 40715 40716 #ifdef __LITTLE_ENDIAN__ 40717 __ai __attribute__((target("neon"))) float32x2_t vrndi_f32(float32x2_t __p0) { 40718 float32x2_t __ret; 40719 __ret = (float32x2_t) __builtin_neon_vrndi_v((int8x8_t)__p0, 9); 40720 return __ret; 40721 } 40722 #else 40723 __ai __attribute__((target("neon"))) float32x2_t vrndi_f32(float32x2_t __p0) { 40724 float32x2_t __ret; 40725 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40726 __ret = (float32x2_t) __builtin_neon_vrndi_v((int8x8_t)__rev0, 9); 40727 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40728 return __ret; 40729 } 40730 #endif 40731 40732 #ifdef __LITTLE_ENDIAN__ 40733 __ai __attribute__((target("neon"))) float32x4_t vrndmq_f32(float32x4_t __p0) { 40734 float32x4_t __ret; 40735 __ret = (float32x4_t) __builtin_neon_vrndmq_v((int8x16_t)__p0, 41); 40736 return __ret; 40737 } 40738 #else 40739 __ai __attribute__((target("neon"))) float32x4_t vrndmq_f32(float32x4_t __p0) { 40740 float32x4_t __ret; 40741 float32x4_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40742 __ret = (float32x4_t) __builtin_neon_vrndmq_v((int8x16_t)__rev0, 41); 40743 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40744 return __ret; 40745 } 40746 #endif 40747 40748 #ifdef __LITTLE_ENDIAN__ 40749 __ai __attribute__((target("neon"))) float32x2_t vrndm_f32(float32x2_t __p0) { 40750 float32x2_t __ret; 40751 __ret = (float32x2_t) __builtin_neon_vrndm_v((int8x8_t)__p0, 9); 40752 return __ret; 40753 } 40754 #else 40755 __ai __attribute__((target("neon"))) float32x2_t vrndm_f32(float32x2_t __p0) { 40756 float32x2_t __ret; 40757 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40758 __ret = (float32x2_t) __builtin_neon_vrndm_v((int8x8_t)__rev0, 9); 40759 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40760 return __ret; 40761 } 40762 #endif 40763 40764 #ifdef __LITTLE_ENDIAN__ 40765 __ai __attribute__((target("neon"))) float32x4_t vrndnq_f32(float32x4_t __p0) { 40766 float32x4_t __ret; 40767 __ret = (float32x4_t) __builtin_neon_vrndnq_v((int8x16_t)__p0, 41); 40768 return __ret; 40769 } 40770 #else 40771 __ai __attribute__((target("neon"))) float32x4_t vrndnq_f32(float32x4_t __p0) { 40772 float32x4_t __ret; 40773 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40774 __ret = (float32x4_t) __builtin_neon_vrndnq_v((int8x16_t)__rev0, 41); 40775 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40776 return __ret; 40777 } 40778 #endif 40779 40780 #ifdef __LITTLE_ENDIAN__ 40781 __ai __attribute__((target("neon"))) float32x2_t vrndn_f32(float32x2_t __p0) { 40782 float32x2_t __ret; 40783 __ret = (float32x2_t) __builtin_neon_vrndn_v((int8x8_t)__p0, 9); 40784 return __ret; 40785 } 40786 #else 40787 __ai __attribute__((target("neon"))) float32x2_t vrndn_f32(float32x2_t __p0) { 40788 float32x2_t __ret; 40789 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40790 __ret = (float32x2_t) 
__builtin_neon_vrndn_v((int8x8_t)__rev0, 9); 40791 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40792 return __ret; 40793 } 40794 #endif 40795 40796 __ai __attribute__((target("neon"))) float32_t vrndns_f32(float32_t __p0) { 40797 float32_t __ret; 40798 __ret = (float32_t) __builtin_neon_vrndns_f32(__p0); 40799 return __ret; 40800 } 40801 #ifdef __LITTLE_ENDIAN__ 40802 __ai __attribute__((target("neon"))) float32x4_t vrndpq_f32(float32x4_t __p0) { 40803 float32x4_t __ret; 40804 __ret = (float32x4_t) __builtin_neon_vrndpq_v((int8x16_t)__p0, 41); 40805 return __ret; 40806 } 40807 #else 40808 __ai __attribute__((target("neon"))) float32x4_t vrndpq_f32(float32x4_t __p0) { 40809 float32x4_t __ret; 40810 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40811 __ret = (float32x4_t) __builtin_neon_vrndpq_v((int8x16_t)__rev0, 41); 40812 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40813 return __ret; 40814 } 40815 #endif 40816 40817 #ifdef __LITTLE_ENDIAN__ 40818 __ai __attribute__((target("neon"))) float32x2_t vrndp_f32(float32x2_t __p0) { 40819 float32x2_t __ret; 40820 __ret = (float32x2_t) __builtin_neon_vrndp_v((int8x8_t)__p0, 9); 40821 return __ret; 40822 } 40823 #else 40824 __ai __attribute__((target("neon"))) float32x2_t vrndp_f32(float32x2_t __p0) { 40825 float32x2_t __ret; 40826 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40827 __ret = (float32x2_t) __builtin_neon_vrndp_v((int8x8_t)__rev0, 9); 40828 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40829 return __ret; 40830 } 40831 #endif 40832 40833 #ifdef __LITTLE_ENDIAN__ 40834 __ai __attribute__((target("neon"))) float32x4_t vrndxq_f32(float32x4_t __p0) { 40835 float32x4_t __ret; 40836 __ret = (float32x4_t) __builtin_neon_vrndxq_v((int8x16_t)__p0, 41); 40837 return __ret; 40838 } 40839 #else 40840 __ai __attribute__((target("neon"))) float32x4_t vrndxq_f32(float32x4_t __p0) { 40841 float32x4_t __ret; 40842 float32x4_t __rev0; 
__rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40843 __ret = (float32x4_t) __builtin_neon_vrndxq_v((int8x16_t)__rev0, 41); 40844 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40845 return __ret; 40846 } 40847 #endif 40848 40849 #ifdef __LITTLE_ENDIAN__ 40850 __ai __attribute__((target("neon"))) float32x2_t vrndx_f32(float32x2_t __p0) { 40851 float32x2_t __ret; 40852 __ret = (float32x2_t) __builtin_neon_vrndx_v((int8x8_t)__p0, 9); 40853 return __ret; 40854 } 40855 #else 40856 __ai __attribute__((target("neon"))) float32x2_t vrndx_f32(float32x2_t __p0) { 40857 float32x2_t __ret; 40858 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40859 __ret = (float32x2_t) __builtin_neon_vrndx_v((int8x8_t)__rev0, 9); 40860 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40861 return __ret; 40862 } 40863 #endif 40864 40865 #endif 40866 #if __ARM_ARCH >= 8 && defined(__ARM_FEATURE_NUMERIC_MAXMIN) 40867 #ifdef __LITTLE_ENDIAN__ 40868 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmaxnmq_f16(float16x8_t __p0, float16x8_t __p1) { 40869 float16x8_t __ret; 40870 __ret = (float16x8_t) __builtin_neon_vmaxnmq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 40871 return __ret; 40872 } 40873 #else 40874 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmaxnmq_f16(float16x8_t __p0, float16x8_t __p1) { 40875 float16x8_t __ret; 40876 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 40877 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 40878 __ret = (float16x8_t) __builtin_neon_vmaxnmq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 40879 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 40880 return __ret; 40881 } 40882 #endif 40883 40884 #ifdef __LITTLE_ENDIAN__ 40885 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmaxnm_f16(float16x4_t __p0, float16x4_t __p1) { 40886 float16x4_t __ret; 40887 __ret = (float16x4_t) 
__builtin_neon_vmaxnm_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 40888 return __ret; 40889 } 40890 #else 40891 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmaxnm_f16(float16x4_t __p0, float16x4_t __p1) { 40892 float16x4_t __ret; 40893 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40894 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40895 __ret = (float16x4_t) __builtin_neon_vmaxnm_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 40896 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40897 return __ret; 40898 } 40899 #endif 40900 40901 #ifdef __LITTLE_ENDIAN__ 40902 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vminnmq_f16(float16x8_t __p0, float16x8_t __p1) { 40903 float16x8_t __ret; 40904 __ret = (float16x8_t) __builtin_neon_vminnmq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 40905 return __ret; 40906 } 40907 #else 40908 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vminnmq_f16(float16x8_t __p0, float16x8_t __p1) { 40909 float16x8_t __ret; 40910 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 40911 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 40912 __ret = (float16x8_t) __builtin_neon_vminnmq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 40913 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 40914 return __ret; 40915 } 40916 #endif 40917 40918 #ifdef __LITTLE_ENDIAN__ 40919 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vminnm_f16(float16x4_t __p0, float16x4_t __p1) { 40920 float16x4_t __ret; 40921 __ret = (float16x4_t) __builtin_neon_vminnm_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 40922 return __ret; 40923 } 40924 #else 40925 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vminnm_f16(float16x4_t __p0, float16x4_t __p1) { 40926 float16x4_t __ret; 40927 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40928 
float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40929 __ret = (float16x4_t) __builtin_neon_vminnm_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 40930 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40931 return __ret; 40932 } 40933 #endif 40934 40935 #ifdef __LITTLE_ENDIAN__ 40936 __ai __attribute__((target("neon"))) float32x4_t vmaxnmq_f32(float32x4_t __p0, float32x4_t __p1) { 40937 float32x4_t __ret; 40938 __ret = (float32x4_t) __builtin_neon_vmaxnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 40939 return __ret; 40940 } 40941 #else 40942 __ai __attribute__((target("neon"))) float32x4_t vmaxnmq_f32(float32x4_t __p0, float32x4_t __p1) { 40943 float32x4_t __ret; 40944 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40945 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40946 __ret = (float32x4_t) __builtin_neon_vmaxnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 40947 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40948 return __ret; 40949 } 40950 #endif 40951 40952 #ifdef __LITTLE_ENDIAN__ 40953 __ai __attribute__((target("neon"))) float32x2_t vmaxnm_f32(float32x2_t __p0, float32x2_t __p1) { 40954 float32x2_t __ret; 40955 __ret = (float32x2_t) __builtin_neon_vmaxnm_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 40956 return __ret; 40957 } 40958 #else 40959 __ai __attribute__((target("neon"))) float32x2_t vmaxnm_f32(float32x2_t __p0, float32x2_t __p1) { 40960 float32x2_t __ret; 40961 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40962 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 40963 __ret = (float32x2_t) __builtin_neon_vmaxnm_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 40964 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40965 return __ret; 40966 } 40967 #endif 40968 40969 #ifdef __LITTLE_ENDIAN__ 40970 __ai __attribute__((target("neon"))) float32x4_t vminnmq_f32(float32x4_t __p0, float32x4_t __p1) { 40971 
float32x4_t __ret; 40972 __ret = (float32x4_t) __builtin_neon_vminnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 40973 return __ret; 40974 } 40975 #else 40976 __ai __attribute__((target("neon"))) float32x4_t vminnmq_f32(float32x4_t __p0, float32x4_t __p1) { 40977 float32x4_t __ret; 40978 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 40979 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 40980 __ret = (float32x4_t) __builtin_neon_vminnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 40981 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 40982 return __ret; 40983 } 40984 #endif 40985 40986 #ifdef __LITTLE_ENDIAN__ 40987 __ai __attribute__((target("neon"))) float32x2_t vminnm_f32(float32x2_t __p0, float32x2_t __p1) { 40988 float32x2_t __ret; 40989 __ret = (float32x2_t) __builtin_neon_vminnm_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 40990 return __ret; 40991 } 40992 #else 40993 __ai __attribute__((target("neon"))) float32x2_t vminnm_f32(float32x2_t __p0, float32x2_t __p1) { 40994 float32x2_t __ret; 40995 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 40996 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 40997 __ret = (float32x2_t) __builtin_neon_vminnm_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 40998 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 40999 return __ret; 41000 } 41001 #endif 41002 41003 #endif 41004 #if defined(__ARM_FEATURE_FMA) 41005 #ifdef __LITTLE_ENDIAN__ 41006 __ai __attribute__((target("neon"))) float32x4_t vfmaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 41007 float32x4_t __ret; 41008 __ret = (float32x4_t) __builtin_neon_vfmaq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 41009 return __ret; 41010 } 41011 #else 41012 __ai __attribute__((target("neon"))) float32x4_t vfmaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 41013 float32x4_t __ret; 41014 float32x4_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41015 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 41016 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 41017 __ret = (float32x4_t) __builtin_neon_vfmaq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 41018 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41019 return __ret; 41020 } 41021 __ai __attribute__((target("neon"))) float32x4_t __noswap_vfmaq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 41022 float32x4_t __ret; 41023 __ret = (float32x4_t) __builtin_neon_vfmaq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 41024 return __ret; 41025 } 41026 #endif 41027 41028 #ifdef __LITTLE_ENDIAN__ 41029 __ai __attribute__((target("neon"))) float32x2_t vfma_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 41030 float32x2_t __ret; 41031 __ret = (float32x2_t) __builtin_neon_vfma_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 41032 return __ret; 41033 } 41034 #else 41035 __ai __attribute__((target("neon"))) float32x2_t vfma_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 41036 float32x2_t __ret; 41037 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 41038 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 41039 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 41040 __ret = (float32x2_t) __builtin_neon_vfma_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 41041 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 41042 return __ret; 41043 } 41044 __ai __attribute__((target("neon"))) float32x2_t __noswap_vfma_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 41045 float32x2_t __ret; 41046 __ret = (float32x2_t) __builtin_neon_vfma_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 41047 return __ret; 41048 } 41049 #endif 41050 41051 #ifdef __LITTLE_ENDIAN__ 41052 __ai 
__attribute__((target("neon"))) float32x4_t vfmaq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) { 41053 float32x4_t __ret; 41054 __ret = vfmaq_f32(__p0, __p1, (float32x4_t) {__p2, __p2, __p2, __p2}); 41055 return __ret; 41056 } 41057 #else 41058 __ai __attribute__((target("neon"))) float32x4_t vfmaq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) { 41059 float32x4_t __ret; 41060 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41061 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 41062 __ret = __noswap_vfmaq_f32(__rev0, __rev1, (float32x4_t) {__p2, __p2, __p2, __p2}); 41063 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41064 return __ret; 41065 } 41066 #endif 41067 41068 #ifdef __LITTLE_ENDIAN__ 41069 __ai __attribute__((target("neon"))) float32x2_t vfma_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) { 41070 float32x2_t __ret; 41071 __ret = vfma_f32(__p0, __p1, (float32x2_t) {__p2, __p2}); 41072 return __ret; 41073 } 41074 #else 41075 __ai __attribute__((target("neon"))) float32x2_t vfma_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) { 41076 float32x2_t __ret; 41077 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 41078 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 41079 __ret = __noswap_vfma_f32(__rev0, __rev1, (float32x2_t) {__p2, __p2}); 41080 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 41081 return __ret; 41082 } 41083 #endif 41084 41085 #ifdef __LITTLE_ENDIAN__ 41086 __ai __attribute__((target("neon"))) float32x4_t vfmsq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 41087 float32x4_t __ret; 41088 __ret = vfmaq_f32(__p0, -__p1, __p2); 41089 return __ret; 41090 } 41091 #else 41092 __ai __attribute__((target("neon"))) float32x4_t vfmsq_f32(float32x4_t __p0, float32x4_t __p1, float32x4_t __p2) { 41093 float32x4_t __ret; 41094 float32x4_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41095 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 41096 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 41097 __ret = __noswap_vfmaq_f32(__rev0, -__rev1, __rev2); 41098 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41099 return __ret; 41100 } 41101 #endif 41102 41103 #ifdef __LITTLE_ENDIAN__ 41104 __ai __attribute__((target("neon"))) float32x2_t vfms_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 41105 float32x2_t __ret; 41106 __ret = vfma_f32(__p0, -__p1, __p2); 41107 return __ret; 41108 } 41109 #else 41110 __ai __attribute__((target("neon"))) float32x2_t vfms_f32(float32x2_t __p0, float32x2_t __p1, float32x2_t __p2) { 41111 float32x2_t __ret; 41112 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 41113 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 41114 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 41115 __ret = __noswap_vfma_f32(__rev0, -__rev1, __rev2); 41116 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 41117 return __ret; 41118 } 41119 #endif 41120 41121 #endif 41122 #if defined(__aarch64__) 41123 #ifdef __LITTLE_ENDIAN__ 41124 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_bf16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) { 41125 bfloat16x8_t __ret; 41126 __ret = (bfloat16x8_t) __builtin_neon_vcvt1_bf16_mf8_fpm(__p0, __p1); 41127 return __ret; 41128 } 41129 #else 41130 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_bf16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) { 41131 bfloat16x8_t __ret; 41132 mfloat8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41133 __ret = (bfloat16x8_t) __builtin_neon_vcvt1_bf16_mf8_fpm(__rev0, __p1); 41134 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41135 return __ret; 41136 } 41137 #endif 41138 41139 #ifdef __LITTLE_ENDIAN__ 41140 __ai 
__attribute__((target("fp8,neon"))) float16x8_t vcvt1_f16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) { 41141 float16x8_t __ret; 41142 __ret = (float16x8_t) __builtin_neon_vcvt1_f16_mf8_fpm(__p0, __p1); 41143 return __ret; 41144 } 41145 #else 41146 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_f16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) { 41147 float16x8_t __ret; 41148 mfloat8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41149 __ret = (float16x8_t) __builtin_neon_vcvt1_f16_mf8_fpm(__rev0, __p1); 41150 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41151 return __ret; 41152 } 41153 #endif 41154 41155 #ifdef __LITTLE_ENDIAN__ 41156 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_high_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41157 bfloat16x8_t __ret; 41158 __ret = (bfloat16x8_t) __builtin_neon_vcvt1_high_bf16_mf8_fpm(__p0, __p1); 41159 return __ret; 41160 } 41161 #else 41162 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_high_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41163 bfloat16x8_t __ret; 41164 mfloat8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41165 __ret = (bfloat16x8_t) __builtin_neon_vcvt1_high_bf16_mf8_fpm(__rev0, __p1); 41166 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41167 return __ret; 41168 } 41169 #endif 41170 41171 #ifdef __LITTLE_ENDIAN__ 41172 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_high_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41173 float16x8_t __ret; 41174 __ret = (float16x8_t) __builtin_neon_vcvt1_high_f16_mf8_fpm(__p0, __p1); 41175 return __ret; 41176 } 41177 #else 41178 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_high_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41179 float16x8_t __ret; 41180 mfloat8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 
41181 __ret = (float16x8_t) __builtin_neon_vcvt1_high_f16_mf8_fpm(__rev0, __p1); 41182 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41183 return __ret; 41184 } 41185 #endif 41186 41187 #ifdef __LITTLE_ENDIAN__ 41188 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_low_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41189 bfloat16x8_t __ret; 41190 __ret = (bfloat16x8_t) __builtin_neon_vcvt1_low_bf16_mf8_fpm(__p0, __p1); 41191 return __ret; 41192 } 41193 #else 41194 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt1_low_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41195 bfloat16x8_t __ret; 41196 mfloat8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41197 __ret = (bfloat16x8_t) __builtin_neon_vcvt1_low_bf16_mf8_fpm(__rev0, __p1); 41198 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41199 return __ret; 41200 } 41201 #endif 41202 41203 #ifdef __LITTLE_ENDIAN__ 41204 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_low_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41205 float16x8_t __ret; 41206 __ret = (float16x8_t) __builtin_neon_vcvt1_low_f16_mf8_fpm(__p0, __p1); 41207 return __ret; 41208 } 41209 #else 41210 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt1_low_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41211 float16x8_t __ret; 41212 mfloat8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41213 __ret = (float16x8_t) __builtin_neon_vcvt1_low_f16_mf8_fpm(__rev0, __p1); 41214 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41215 return __ret; 41216 } 41217 #endif 41218 41219 #ifdef __LITTLE_ENDIAN__ 41220 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_bf16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) { 41221 bfloat16x8_t __ret; 41222 __ret = (bfloat16x8_t) __builtin_neon_vcvt2_bf16_mf8_fpm(__p0, __p1); 41223 return __ret; 
41224 } 41225 #else 41226 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_bf16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) { 41227 bfloat16x8_t __ret; 41228 mfloat8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41229 __ret = (bfloat16x8_t) __builtin_neon_vcvt2_bf16_mf8_fpm(__rev0, __p1); 41230 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41231 return __ret; 41232 } 41233 #endif 41234 41235 #ifdef __LITTLE_ENDIAN__ 41236 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_f16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) { 41237 float16x8_t __ret; 41238 __ret = (float16x8_t) __builtin_neon_vcvt2_f16_mf8_fpm(__p0, __p1); 41239 return __ret; 41240 } 41241 #else 41242 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_f16_mf8_fpm(mfloat8x8_t __p0, fpm_t __p1) { 41243 float16x8_t __ret; 41244 mfloat8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41245 __ret = (float16x8_t) __builtin_neon_vcvt2_f16_mf8_fpm(__rev0, __p1); 41246 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41247 return __ret; 41248 } 41249 #endif 41250 41251 #ifdef __LITTLE_ENDIAN__ 41252 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_high_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41253 bfloat16x8_t __ret; 41254 __ret = (bfloat16x8_t) __builtin_neon_vcvt2_high_bf16_mf8_fpm(__p0, __p1); 41255 return __ret; 41256 } 41257 #else 41258 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_high_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41259 bfloat16x8_t __ret; 41260 mfloat8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41261 __ret = (bfloat16x8_t) __builtin_neon_vcvt2_high_bf16_mf8_fpm(__rev0, __p1); 41262 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41263 return __ret; 41264 } 41265 #endif 41266 41267 #ifdef __LITTLE_ENDIAN__ 41268 __ai 
__attribute__((target("fp8,neon"))) float16x8_t vcvt2_high_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41269 float16x8_t __ret; 41270 __ret = (float16x8_t) __builtin_neon_vcvt2_high_f16_mf8_fpm(__p0, __p1); 41271 return __ret; 41272 } 41273 #else 41274 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_high_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41275 float16x8_t __ret; 41276 mfloat8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41277 __ret = (float16x8_t) __builtin_neon_vcvt2_high_f16_mf8_fpm(__rev0, __p1); 41278 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41279 return __ret; 41280 } 41281 #endif 41282 41283 #ifdef __LITTLE_ENDIAN__ 41284 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_low_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41285 bfloat16x8_t __ret; 41286 __ret = (bfloat16x8_t) __builtin_neon_vcvt2_low_bf16_mf8_fpm(__p0, __p1); 41287 return __ret; 41288 } 41289 #else 41290 __ai __attribute__((target("fp8,neon"))) bfloat16x8_t vcvt2_low_bf16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41291 bfloat16x8_t __ret; 41292 mfloat8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41293 __ret = (bfloat16x8_t) __builtin_neon_vcvt2_low_bf16_mf8_fpm(__rev0, __p1); 41294 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41295 return __ret; 41296 } 41297 #endif 41298 41299 #ifdef __LITTLE_ENDIAN__ 41300 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_low_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41301 float16x8_t __ret; 41302 __ret = (float16x8_t) __builtin_neon_vcvt2_low_f16_mf8_fpm(__p0, __p1); 41303 return __ret; 41304 } 41305 #else 41306 __ai __attribute__((target("fp8,neon"))) float16x8_t vcvt2_low_f16_mf8_fpm(mfloat8x16_t __p0, fpm_t __p1) { 41307 float16x8_t __ret; 41308 mfloat8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 
12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41309 __ret = (float16x8_t) __builtin_neon_vcvt2_low_f16_mf8_fpm(__rev0, __p1); 41310 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41311 return __ret; 41312 } 41313 #endif 41314 41315 #ifdef __LITTLE_ENDIAN__ 41316 __ai __attribute__((target("fp8,neon"))) mfloat8x16_t vcvt_high_mf8_f32_fpm(mfloat8x8_t __p0, float32x4_t __p1, float32x4_t __p2, fpm_t __p3) { 41317 mfloat8x16_t __ret; 41318 __ret = (mfloat8x16_t) __builtin_neon_vcvt_high_mf8_f32_fpm(__p0, __p1, __p2, __p3); 41319 return __ret; 41320 } 41321 #else 41322 __ai __attribute__((target("fp8,neon"))) mfloat8x16_t vcvt_high_mf8_f32_fpm(mfloat8x8_t __p0, float32x4_t __p1, float32x4_t __p2, fpm_t __p3) { 41323 mfloat8x16_t __ret; 41324 mfloat8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41325 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 41326 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 41327 __ret = (mfloat8x16_t) __builtin_neon_vcvt_high_mf8_f32_fpm(__rev0, __rev1, __rev2, __p3); 41328 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41329 return __ret; 41330 } 41331 #endif 41332 41333 #ifdef __LITTLE_ENDIAN__ 41334 __ai __attribute__((target("fp8,neon"))) mfloat8x16_t vcvtq_mf8_f16_fpm(float16x8_t __p0, float16x8_t __p1, fpm_t __p2) { 41335 mfloat8x16_t __ret; 41336 __ret = (mfloat8x16_t) __builtin_neon_vcvtq_mf8_f16_fpm((int8x16_t)__p0, (int8x16_t)__p1, __p2); 41337 return __ret; 41338 } 41339 #else 41340 __ai __attribute__((target("fp8,neon"))) mfloat8x16_t vcvtq_mf8_f16_fpm(float16x8_t __p0, float16x8_t __p1, fpm_t __p2) { 41341 mfloat8x16_t __ret; 41342 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41343 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 41344 __ret = (mfloat8x16_t) 
__builtin_neon_vcvtq_mf8_f16_fpm((int8x16_t)__rev0, (int8x16_t)__rev1, __p2); 41345 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41346 return __ret; 41347 } 41348 #endif 41349 41350 #ifdef __LITTLE_ENDIAN__ 41351 __ai __attribute__((target("fp8,neon"))) mfloat8x8_t vcvt_mf8_f16_fpm(float16x4_t __p0, float16x4_t __p1, fpm_t __p2) { 41352 mfloat8x8_t __ret; 41353 __ret = (mfloat8x8_t) __builtin_neon_vcvt_mf8_f16_fpm((int8x8_t)__p0, (int8x8_t)__p1, __p2); 41354 return __ret; 41355 } 41356 #else 41357 __ai __attribute__((target("fp8,neon"))) mfloat8x8_t vcvt_mf8_f16_fpm(float16x4_t __p0, float16x4_t __p1, fpm_t __p2) { 41358 mfloat8x8_t __ret; 41359 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41360 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 41361 __ret = (mfloat8x8_t) __builtin_neon_vcvt_mf8_f16_fpm((int8x8_t)__rev0, (int8x8_t)__rev1, __p2); 41362 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41363 return __ret; 41364 } 41365 #endif 41366 41367 #ifdef __LITTLE_ENDIAN__ 41368 __ai __attribute__((target("fp8,neon"))) mfloat8x8_t vcvt_mf8_f32_fpm(float32x4_t __p0, float32x4_t __p1, fpm_t __p2) { 41369 mfloat8x8_t __ret; 41370 __ret = (mfloat8x8_t) __builtin_neon_vcvt_mf8_f32_fpm(__p0, __p1, __p2); 41371 return __ret; 41372 } 41373 #else 41374 __ai __attribute__((target("fp8,neon"))) mfloat8x8_t vcvt_mf8_f32_fpm(float32x4_t __p0, float32x4_t __p1, fpm_t __p2) { 41375 mfloat8x8_t __ret; 41376 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41377 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 41378 __ret = (mfloat8x8_t) __builtin_neon_vcvt_mf8_f32_fpm(__rev0, __rev1, __p2); 41379 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41380 return __ret; 41381 } 41382 #endif 41383 41384 #ifdef __LITTLE_ENDIAN__ 41385 __ai 
__attribute__((target("fp8,neon"))) float32x2_t vscale_f32(float32x2_t __p0, int32x2_t __p1) { 41386 float32x2_t __ret; 41387 __ret = (float32x2_t) __builtin_neon_vscale_f32((int8x8_t)__p0, (int8x8_t)__p1, 9); 41388 return __ret; 41389 } 41390 #else 41391 __ai __attribute__((target("fp8,neon"))) float32x2_t vscale_f32(float32x2_t __p0, int32x2_t __p1) { 41392 float32x2_t __ret; 41393 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 41394 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 41395 __ret = (float32x2_t) __builtin_neon_vscale_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 41396 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 41397 return __ret; 41398 } 41399 #endif 41400 41401 #ifdef __LITTLE_ENDIAN__ 41402 __ai __attribute__((target("fp8,neon"))) float16x4_t vscale_f16(float16x4_t __p0, int16x4_t __p1) { 41403 float16x4_t __ret; 41404 __ret = (float16x4_t) __builtin_neon_vscale_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 41405 return __ret; 41406 } 41407 #else 41408 __ai __attribute__((target("fp8,neon"))) float16x4_t vscale_f16(float16x4_t __p0, int16x4_t __p1) { 41409 float16x4_t __ret; 41410 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41411 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 41412 __ret = (float16x4_t) __builtin_neon_vscale_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 41413 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41414 return __ret; 41415 } 41416 #endif 41417 41418 #ifdef __LITTLE_ENDIAN__ 41419 __ai __attribute__((target("fp8,neon"))) float64x2_t vscaleq_f64(float64x2_t __p0, int64x2_t __p1) { 41420 float64x2_t __ret; 41421 __ret = (float64x2_t) __builtin_neon_vscaleq_f64((int8x16_t)__p0, (int8x16_t)__p1, 42); 41422 return __ret; 41423 } 41424 #else 41425 __ai __attribute__((target("fp8,neon"))) float64x2_t vscaleq_f64(float64x2_t __p0, int64x2_t __p1) { 41426 float64x2_t __ret; 41427 float64x2_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 1, 0); 41428 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 41429 __ret = (float64x2_t) __builtin_neon_vscaleq_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 41430 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 41431 return __ret; 41432 } 41433 #endif 41434 41435 #ifdef __LITTLE_ENDIAN__ 41436 __ai __attribute__((target("fp8,neon"))) float32x4_t vscaleq_f32(float32x4_t __p0, int32x4_t __p1) { 41437 float32x4_t __ret; 41438 __ret = (float32x4_t) __builtin_neon_vscaleq_f32((int8x16_t)__p0, (int8x16_t)__p1, 41); 41439 return __ret; 41440 } 41441 #else 41442 __ai __attribute__((target("fp8,neon"))) float32x4_t vscaleq_f32(float32x4_t __p0, int32x4_t __p1) { 41443 float32x4_t __ret; 41444 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41445 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 41446 __ret = (float32x4_t) __builtin_neon_vscaleq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 41447 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41448 return __ret; 41449 } 41450 #endif 41451 41452 #ifdef __LITTLE_ENDIAN__ 41453 __ai __attribute__((target("fp8,neon"))) float16x8_t vscaleq_f16(float16x8_t __p0, int16x8_t __p1) { 41454 float16x8_t __ret; 41455 __ret = (float16x8_t) __builtin_neon_vscaleq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 41456 return __ret; 41457 } 41458 #else 41459 __ai __attribute__((target("fp8,neon"))) float16x8_t vscaleq_f16(float16x8_t __p0, int16x8_t __p1) { 41460 float16x8_t __ret; 41461 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41462 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 41463 __ret = (float16x8_t) __builtin_neon_vscaleq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 41464 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41465 return __ret; 41466 } 41467 #endif 41468 41469 #ifdef __LITTLE_ENDIAN__ 
41470 __ai __attribute__((target("fp8dot2,neon"))) float16x8_t vdotq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41471 float16x8_t __ret; 41472 __ret = (float16x8_t) __builtin_neon_vdotq_f16_mf8_fpm((int8x16_t)__p0, __p1, __p2, __p3); 41473 return __ret; 41474 } 41475 #else 41476 __ai __attribute__((target("fp8dot2,neon"))) float16x8_t vdotq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41477 float16x8_t __ret; 41478 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41479 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41480 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41481 __ret = (float16x8_t) __builtin_neon_vdotq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3); 41482 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41483 return __ret; 41484 } 41485 #endif 41486 41487 #ifdef __LITTLE_ENDIAN__ 41488 __ai __attribute__((target("fp8dot2,neon"))) float16x4_t vdot_f16_mf8_fpm(float16x4_t __p0, mfloat8x8_t __p1, mfloat8x8_t __p2, fpm_t __p3) { 41489 float16x4_t __ret; 41490 __ret = (float16x4_t) __builtin_neon_vdot_f16_mf8_fpm((int8x8_t)__p0, __p1, __p2, __p3); 41491 return __ret; 41492 } 41493 #else 41494 __ai __attribute__((target("fp8dot2,neon"))) float16x4_t vdot_f16_mf8_fpm(float16x4_t __p0, mfloat8x8_t __p1, mfloat8x8_t __p2, fpm_t __p3) { 41495 float16x4_t __ret; 41496 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41497 mfloat8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 41498 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 41499 __ret = (float16x4_t) __builtin_neon_vdot_f16_mf8_fpm((int8x8_t)__rev0, __rev1, __rev2, __p3); 41500 __ret = __builtin_shufflevector(__ret, 
__ret, 3, 2, 1, 0); 41501 return __ret; 41502 } 41503 #endif 41504 41505 #ifdef __LITTLE_ENDIAN__ 41506 #define vdotq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41507 float16x8_t __ret; \ 41508 float16x8_t __s0 = __p0; \ 41509 mfloat8x16_t __s1 = __p1; \ 41510 mfloat8x8_t __s2 = __p2; \ 41511 fpm_t __s4 = __p4; \ 41512 __ret = (float16x8_t) __builtin_neon_vdotq_lane_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \ 41513 __ret; \ 41514 }) 41515 #else 41516 #define vdotq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41517 float16x8_t __ret; \ 41518 float16x8_t __s0 = __p0; \ 41519 mfloat8x16_t __s1 = __p1; \ 41520 mfloat8x8_t __s2 = __p2; \ 41521 fpm_t __s4 = __p4; \ 41522 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 41523 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41524 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 41525 __ret = (float16x8_t) __builtin_neon_vdotq_lane_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \ 41526 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 41527 __ret; \ 41528 }) 41529 #endif 41530 41531 #ifdef __LITTLE_ENDIAN__ 41532 #define vdot_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41533 float16x4_t __ret; \ 41534 float16x4_t __s0 = __p0; \ 41535 mfloat8x8_t __s1 = __p1; \ 41536 mfloat8x8_t __s2 = __p2; \ 41537 fpm_t __s4 = __p4; \ 41538 __ret = (float16x4_t) __builtin_neon_vdot_lane_f16_mf8_fpm((int8x8_t)__s0, __s1, __s2, __p3, __s4); \ 41539 __ret; \ 41540 }) 41541 #else 41542 #define vdot_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41543 float16x4_t __ret; \ 41544 float16x4_t __s0 = __p0; \ 41545 mfloat8x8_t __s1 = __p1; \ 41546 mfloat8x8_t __s2 = __p2; \ 41547 fpm_t __s4 = __p4; \ 41548 float16x4_t __rev0; __rev0 = 
__builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 41549 mfloat8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 41550 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 41551 __ret = (float16x4_t) __builtin_neon_vdot_lane_f16_mf8_fpm((int8x8_t)__rev0, __rev1, __rev2, __p3, __s4); \ 41552 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41553 __ret; \ 41554 }) 41555 #endif 41556 41557 #ifdef __LITTLE_ENDIAN__ 41558 #define vdotq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41559 float16x8_t __ret; \ 41560 float16x8_t __s0 = __p0; \ 41561 mfloat8x16_t __s1 = __p1; \ 41562 mfloat8x16_t __s2 = __p2; \ 41563 fpm_t __s4 = __p4; \ 41564 __ret = (float16x8_t) __builtin_neon_vdotq_laneq_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \ 41565 __ret; \ 41566 }) 41567 #else 41568 #define vdotq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41569 float16x8_t __ret; \ 41570 float16x8_t __s0 = __p0; \ 41571 mfloat8x16_t __s1 = __p1; \ 41572 mfloat8x16_t __s2 = __p2; \ 41573 fpm_t __s4 = __p4; \ 41574 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 41575 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41576 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41577 __ret = (float16x8_t) __builtin_neon_vdotq_laneq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \ 41578 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 41579 __ret; \ 41580 }) 41581 #endif 41582 41583 #ifdef __LITTLE_ENDIAN__ 41584 #define vdot_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41585 float16x4_t __ret; \ 41586 float16x4_t __s0 = __p0; \ 41587 mfloat8x8_t __s1 = __p1; \ 41588 mfloat8x16_t __s2 = __p2; \ 41589 fpm_t __s4 = __p4; \ 
41590 __ret = (float16x4_t) __builtin_neon_vdot_laneq_f16_mf8_fpm((int8x8_t)__s0, __s1, __s2, __p3, __s4); \ 41591 __ret; \ 41592 }) 41593 #else 41594 #define vdot_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41595 float16x4_t __ret; \ 41596 float16x4_t __s0 = __p0; \ 41597 mfloat8x8_t __s1 = __p1; \ 41598 mfloat8x16_t __s2 = __p2; \ 41599 fpm_t __s4 = __p4; \ 41600 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 41601 mfloat8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 41602 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41603 __ret = (float16x4_t) __builtin_neon_vdot_laneq_f16_mf8_fpm((int8x8_t)__rev0, __rev1, __rev2, __p3, __s4); \ 41604 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41605 __ret; \ 41606 }) 41607 #endif 41608 41609 #ifdef __LITTLE_ENDIAN__ 41610 __ai __attribute__((target("fp8dot4,neon"))) float32x4_t vdotq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41611 float32x4_t __ret; 41612 __ret = (float32x4_t) __builtin_neon_vdotq_f32_mf8_fpm(__p0, __p1, __p2, __p3); 41613 return __ret; 41614 } 41615 #else 41616 __ai __attribute__((target("fp8dot4,neon"))) float32x4_t vdotq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41617 float32x4_t __ret; 41618 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41619 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41620 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41621 __ret = (float32x4_t) __builtin_neon_vdotq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3); 41622 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41623 return __ret; 41624 } 41625 #endif 41626 41627 #ifdef 
__LITTLE_ENDIAN__ 41628 __ai __attribute__((target("fp8dot4,neon"))) float32x2_t vdot_f32_mf8_fpm(float32x2_t __p0, mfloat8x8_t __p1, mfloat8x8_t __p2, fpm_t __p3) { 41629 float32x2_t __ret; 41630 __ret = (float32x2_t) __builtin_neon_vdot_f32_mf8_fpm(__p0, __p1, __p2, __p3); 41631 return __ret; 41632 } 41633 #else 41634 __ai __attribute__((target("fp8dot4,neon"))) float32x2_t vdot_f32_mf8_fpm(float32x2_t __p0, mfloat8x8_t __p1, mfloat8x8_t __p2, fpm_t __p3) { 41635 float32x2_t __ret; 41636 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 41637 mfloat8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 41638 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 41639 __ret = (float32x2_t) __builtin_neon_vdot_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3); 41640 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 41641 return __ret; 41642 } 41643 #endif 41644 41645 #ifdef __LITTLE_ENDIAN__ 41646 #define vdotq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41647 float32x4_t __ret; \ 41648 float32x4_t __s0 = __p0; \ 41649 mfloat8x16_t __s1 = __p1; \ 41650 mfloat8x8_t __s2 = __p2; \ 41651 fpm_t __s4 = __p4; \ 41652 __ret = (float32x4_t) __builtin_neon_vdotq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41653 __ret; \ 41654 }) 41655 #else 41656 #define vdotq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41657 float32x4_t __ret; \ 41658 float32x4_t __s0 = __p0; \ 41659 mfloat8x16_t __s1 = __p1; \ 41660 mfloat8x8_t __s2 = __p2; \ 41661 fpm_t __s4 = __p4; \ 41662 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 41663 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41664 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 41665 __ret = (float32x4_t) __builtin_neon_vdotq_lane_f32_mf8_fpm(__rev0, __rev1, 
__rev2, __p3, __s4); \ 41666 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41667 __ret; \ 41668 }) 41669 #endif 41670 41671 #ifdef __LITTLE_ENDIAN__ 41672 #define vdot_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41673 float32x2_t __ret; \ 41674 float32x2_t __s0 = __p0; \ 41675 mfloat8x8_t __s1 = __p1; \ 41676 mfloat8x8_t __s2 = __p2; \ 41677 fpm_t __s4 = __p4; \ 41678 __ret = (float32x2_t) __builtin_neon_vdot_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41679 __ret; \ 41680 }) 41681 #else 41682 #define vdot_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41683 float32x2_t __ret; \ 41684 float32x2_t __s0 = __p0; \ 41685 mfloat8x8_t __s1 = __p1; \ 41686 mfloat8x8_t __s2 = __p2; \ 41687 fpm_t __s4 = __p4; \ 41688 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 41689 mfloat8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 41690 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 41691 __ret = (float32x2_t) __builtin_neon_vdot_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 41692 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 41693 __ret; \ 41694 }) 41695 #endif 41696 41697 #ifdef __LITTLE_ENDIAN__ 41698 #define vdotq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41699 float32x4_t __ret; \ 41700 float32x4_t __s0 = __p0; \ 41701 mfloat8x16_t __s1 = __p1; \ 41702 mfloat8x16_t __s2 = __p2; \ 41703 fpm_t __s4 = __p4; \ 41704 __ret = (float32x4_t) __builtin_neon_vdotq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41705 __ret; \ 41706 }) 41707 #else 41708 #define vdotq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41709 float32x4_t __ret; \ 41710 float32x4_t __s0 = __p0; \ 41711 mfloat8x16_t __s1 = __p1; \ 41712 mfloat8x16_t __s2 = __p2; \ 41713 fpm_t __s4 = __p4; \ 41714 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 
41715 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41716 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41717 __ret = (float32x4_t) __builtin_neon_vdotq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 41718 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41719 __ret; \ 41720 }) 41721 #endif 41722 41723 #ifdef __LITTLE_ENDIAN__ 41724 #define vdot_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41725 float32x2_t __ret; \ 41726 float32x2_t __s0 = __p0; \ 41727 mfloat8x8_t __s1 = __p1; \ 41728 mfloat8x16_t __s2 = __p2; \ 41729 fpm_t __s4 = __p4; \ 41730 __ret = (float32x2_t) __builtin_neon_vdot_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41731 __ret; \ 41732 }) 41733 #else 41734 #define vdot_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41735 float32x2_t __ret; \ 41736 float32x2_t __s0 = __p0; \ 41737 mfloat8x8_t __s1 = __p1; \ 41738 mfloat8x16_t __s2 = __p2; \ 41739 fpm_t __s4 = __p4; \ 41740 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 41741 mfloat8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 41742 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41743 __ret = (float32x2_t) __builtin_neon_vdot_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 41744 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 41745 __ret; \ 41746 }) 41747 #endif 41748 41749 #ifdef __LITTLE_ENDIAN__ 41750 __ai __attribute__((target("fp8fma,neon"))) float16x8_t vmlalbq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41751 float16x8_t __ret; 41752 __ret = (float16x8_t) __builtin_neon_vmlalbq_f16_mf8_fpm((int8x16_t)__p0, __p1, __p2, __p3); 41753 return __ret; 41754 } 41755 #else 41756 __ai 
__attribute__((target("fp8fma,neon"))) float16x8_t vmlalbq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41757 float16x8_t __ret; 41758 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 41759 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41760 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41761 __ret = (float16x8_t) __builtin_neon_vmlalbq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3); 41762 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 41763 return __ret; 41764 } 41765 #endif 41766 41767 #ifdef __LITTLE_ENDIAN__ 41768 #define vmlalbq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41769 float16x8_t __ret; \ 41770 float16x8_t __s0 = __p0; \ 41771 mfloat8x16_t __s1 = __p1; \ 41772 mfloat8x8_t __s2 = __p2; \ 41773 fpm_t __s4 = __p4; \ 41774 __ret = (float16x8_t) __builtin_neon_vmlalbq_lane_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \ 41775 __ret; \ 41776 }) 41777 #else 41778 #define vmlalbq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41779 float16x8_t __ret; \ 41780 float16x8_t __s0 = __p0; \ 41781 mfloat8x16_t __s1 = __p1; \ 41782 mfloat8x8_t __s2 = __p2; \ 41783 fpm_t __s4 = __p4; \ 41784 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 41785 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41786 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 41787 __ret = (float16x8_t) __builtin_neon_vmlalbq_lane_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \ 41788 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 41789 __ret; \ 41790 }) 41791 #endif 41792 41793 #ifdef 
__LITTLE_ENDIAN__ 41794 #define vmlalbq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41795 float16x8_t __ret; \ 41796 float16x8_t __s0 = __p0; \ 41797 mfloat8x16_t __s1 = __p1; \ 41798 mfloat8x16_t __s2 = __p2; \ 41799 fpm_t __s4 = __p4; \ 41800 __ret = (float16x8_t) __builtin_neon_vmlalbq_laneq_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \ 41801 __ret; \ 41802 }) 41803 #else 41804 #define vmlalbq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41805 float16x8_t __ret; \ 41806 float16x8_t __s0 = __p0; \ 41807 mfloat8x16_t __s1 = __p1; \ 41808 mfloat8x16_t __s2 = __p2; \ 41809 fpm_t __s4 = __p4; \ 41810 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 41811 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41812 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41813 __ret = (float16x8_t) __builtin_neon_vmlalbq_laneq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \ 41814 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 41815 __ret; \ 41816 }) 41817 #endif 41818 41819 #ifdef __LITTLE_ENDIAN__ 41820 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallbbq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41821 float32x4_t __ret; 41822 __ret = (float32x4_t) __builtin_neon_vmlallbbq_f32_mf8_fpm(__p0, __p1, __p2, __p3); 41823 return __ret; 41824 } 41825 #else 41826 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallbbq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41827 float32x4_t __ret; 41828 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41829 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41830 
mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41831 __ret = (float32x4_t) __builtin_neon_vmlallbbq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3); 41832 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41833 return __ret; 41834 } 41835 #endif 41836 41837 #ifdef __LITTLE_ENDIAN__ 41838 #define vmlallbbq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41839 float32x4_t __ret; \ 41840 float32x4_t __s0 = __p0; \ 41841 mfloat8x16_t __s1 = __p1; \ 41842 mfloat8x8_t __s2 = __p2; \ 41843 fpm_t __s4 = __p4; \ 41844 __ret = (float32x4_t) __builtin_neon_vmlallbbq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41845 __ret; \ 41846 }) 41847 #else 41848 #define vmlallbbq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41849 float32x4_t __ret; \ 41850 float32x4_t __s0 = __p0; \ 41851 mfloat8x16_t __s1 = __p1; \ 41852 mfloat8x8_t __s2 = __p2; \ 41853 fpm_t __s4 = __p4; \ 41854 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 41855 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41856 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 41857 __ret = (float32x4_t) __builtin_neon_vmlallbbq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 41858 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41859 __ret; \ 41860 }) 41861 #endif 41862 41863 #ifdef __LITTLE_ENDIAN__ 41864 #define vmlallbbq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41865 float32x4_t __ret; \ 41866 float32x4_t __s0 = __p0; \ 41867 mfloat8x16_t __s1 = __p1; \ 41868 mfloat8x16_t __s2 = __p2; \ 41869 fpm_t __s4 = __p4; \ 41870 __ret = (float32x4_t) __builtin_neon_vmlallbbq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41871 __ret; \ 41872 }) 41873 #else 41874 #define vmlallbbq_laneq_f32_mf8_fpm(__p0, __p1, __p2, 
__p3, __p4) __extension__ ({ \ 41875 float32x4_t __ret; \ 41876 float32x4_t __s0 = __p0; \ 41877 mfloat8x16_t __s1 = __p1; \ 41878 mfloat8x16_t __s2 = __p2; \ 41879 fpm_t __s4 = __p4; \ 41880 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 41881 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41882 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41883 __ret = (float32x4_t) __builtin_neon_vmlallbbq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 41884 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41885 __ret; \ 41886 }) 41887 #endif 41888 41889 #ifdef __LITTLE_ENDIAN__ 41890 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallbtq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41891 float32x4_t __ret; 41892 __ret = (float32x4_t) __builtin_neon_vmlallbtq_f32_mf8_fpm(__p0, __p1, __p2, __p3); 41893 return __ret; 41894 } 41895 #else 41896 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallbtq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41897 float32x4_t __ret; 41898 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41899 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41900 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41901 __ret = (float32x4_t) __builtin_neon_vmlallbtq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3); 41902 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41903 return __ret; 41904 } 41905 #endif 41906 41907 #ifdef __LITTLE_ENDIAN__ 41908 #define vmlallbtq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41909 float32x4_t __ret; \ 41910 float32x4_t __s0 = __p0; \ 
41911 mfloat8x16_t __s1 = __p1; \ 41912 mfloat8x8_t __s2 = __p2; \ 41913 fpm_t __s4 = __p4; \ 41914 __ret = (float32x4_t) __builtin_neon_vmlallbtq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41915 __ret; \ 41916 }) 41917 #else 41918 #define vmlallbtq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41919 float32x4_t __ret; \ 41920 float32x4_t __s0 = __p0; \ 41921 mfloat8x16_t __s1 = __p1; \ 41922 mfloat8x8_t __s2 = __p2; \ 41923 fpm_t __s4 = __p4; \ 41924 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 41925 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41926 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 41927 __ret = (float32x4_t) __builtin_neon_vmlallbtq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 41928 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41929 __ret; \ 41930 }) 41931 #endif 41932 41933 #ifdef __LITTLE_ENDIAN__ 41934 #define vmlallbtq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41935 float32x4_t __ret; \ 41936 float32x4_t __s0 = __p0; \ 41937 mfloat8x16_t __s1 = __p1; \ 41938 mfloat8x16_t __s2 = __p2; \ 41939 fpm_t __s4 = __p4; \ 41940 __ret = (float32x4_t) __builtin_neon_vmlallbtq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41941 __ret; \ 41942 }) 41943 #else 41944 #define vmlallbtq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41945 float32x4_t __ret; \ 41946 float32x4_t __s0 = __p0; \ 41947 mfloat8x16_t __s1 = __p1; \ 41948 mfloat8x16_t __s2 = __p2; \ 41949 fpm_t __s4 = __p4; \ 41950 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 41951 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41952 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 
4, 3, 2, 1, 0); \ 41953 __ret = (float32x4_t) __builtin_neon_vmlallbtq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 41954 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41955 __ret; \ 41956 }) 41957 #endif 41958 41959 #ifdef __LITTLE_ENDIAN__ 41960 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlalltbq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41961 float32x4_t __ret; 41962 __ret = (float32x4_t) __builtin_neon_vmlalltbq_f32_mf8_fpm(__p0, __p1, __p2, __p3); 41963 return __ret; 41964 } 41965 #else 41966 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlalltbq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 41967 float32x4_t __ret; 41968 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 41969 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41970 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 41971 __ret = (float32x4_t) __builtin_neon_vmlalltbq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3); 41972 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 41973 return __ret; 41974 } 41975 #endif 41976 41977 #ifdef __LITTLE_ENDIAN__ 41978 #define vmlalltbq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41979 float32x4_t __ret; \ 41980 float32x4_t __s0 = __p0; \ 41981 mfloat8x16_t __s1 = __p1; \ 41982 mfloat8x8_t __s2 = __p2; \ 41983 fpm_t __s4 = __p4; \ 41984 __ret = (float32x4_t) __builtin_neon_vmlalltbq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 41985 __ret; \ 41986 }) 41987 #else 41988 #define vmlalltbq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 41989 float32x4_t __ret; \ 41990 float32x4_t __s0 = __p0; \ 41991 mfloat8x16_t __s1 = __p1; \ 41992 mfloat8x8_t __s2 = __p2; \ 41993 fpm_t __s4 = __p4; \ 41994 float32x4_t __rev0; __rev0 = 
__builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 41995 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 41996 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 41997 __ret = (float32x4_t) __builtin_neon_vmlalltbq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 41998 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 41999 __ret; \ 42000 }) 42001 #endif 42002 42003 #ifdef __LITTLE_ENDIAN__ 42004 #define vmlalltbq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42005 float32x4_t __ret; \ 42006 float32x4_t __s0 = __p0; \ 42007 mfloat8x16_t __s1 = __p1; \ 42008 mfloat8x16_t __s2 = __p2; \ 42009 fpm_t __s4 = __p4; \ 42010 __ret = (float32x4_t) __builtin_neon_vmlalltbq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 42011 __ret; \ 42012 }) 42013 #else 42014 #define vmlalltbq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42015 float32x4_t __ret; \ 42016 float32x4_t __s0 = __p0; \ 42017 mfloat8x16_t __s1 = __p1; \ 42018 mfloat8x16_t __s2 = __p2; \ 42019 fpm_t __s4 = __p4; \ 42020 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42021 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42022 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42023 __ret = (float32x4_t) __builtin_neon_vmlalltbq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 42024 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 42025 __ret; \ 42026 }) 42027 #endif 42028 42029 #ifdef __LITTLE_ENDIAN__ 42030 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallttq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 42031 float32x4_t __ret; 42032 __ret = (float32x4_t) 
__builtin_neon_vmlallttq_f32_mf8_fpm(__p0, __p1, __p2, __p3); 42033 return __ret; 42034 } 42035 #else 42036 __ai __attribute__((target("fp8fma,neon"))) float32x4_t vmlallttq_f32_mf8_fpm(float32x4_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 42037 float32x4_t __ret; 42038 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 42039 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 42040 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 42041 __ret = (float32x4_t) __builtin_neon_vmlallttq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3); 42042 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 42043 return __ret; 42044 } 42045 #endif 42046 42047 #ifdef __LITTLE_ENDIAN__ 42048 #define vmlallttq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42049 float32x4_t __ret; \ 42050 float32x4_t __s0 = __p0; \ 42051 mfloat8x16_t __s1 = __p1; \ 42052 mfloat8x8_t __s2 = __p2; \ 42053 fpm_t __s4 = __p4; \ 42054 __ret = (float32x4_t) __builtin_neon_vmlallttq_lane_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 42055 __ret; \ 42056 }) 42057 #else 42058 #define vmlallttq_lane_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42059 float32x4_t __ret; \ 42060 float32x4_t __s0 = __p0; \ 42061 mfloat8x16_t __s1 = __p1; \ 42062 mfloat8x8_t __s2 = __p2; \ 42063 fpm_t __s4 = __p4; \ 42064 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42065 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42066 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 42067 __ret = (float32x4_t) __builtin_neon_vmlallttq_lane_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 42068 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 42069 __ret; \ 42070 }) 
42071 #endif 42072 42073 #ifdef __LITTLE_ENDIAN__ 42074 #define vmlallttq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42075 float32x4_t __ret; \ 42076 float32x4_t __s0 = __p0; \ 42077 mfloat8x16_t __s1 = __p1; \ 42078 mfloat8x16_t __s2 = __p2; \ 42079 fpm_t __s4 = __p4; \ 42080 __ret = (float32x4_t) __builtin_neon_vmlallttq_laneq_f32_mf8_fpm(__s0, __s1, __s2, __p3, __s4); \ 42081 __ret; \ 42082 }) 42083 #else 42084 #define vmlallttq_laneq_f32_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42085 float32x4_t __ret; \ 42086 float32x4_t __s0 = __p0; \ 42087 mfloat8x16_t __s1 = __p1; \ 42088 mfloat8x16_t __s2 = __p2; \ 42089 fpm_t __s4 = __p4; \ 42090 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42091 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42092 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42093 __ret = (float32x4_t) __builtin_neon_vmlallttq_laneq_f32_mf8_fpm(__rev0, __rev1, __rev2, __p3, __s4); \ 42094 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 42095 __ret; \ 42096 }) 42097 #endif 42098 42099 #ifdef __LITTLE_ENDIAN__ 42100 __ai __attribute__((target("fp8fma,neon"))) float16x8_t vmlaltq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 42101 float16x8_t __ret; 42102 __ret = (float16x8_t) __builtin_neon_vmlaltq_f16_mf8_fpm((int8x16_t)__p0, __p1, __p2, __p3); 42103 return __ret; 42104 } 42105 #else 42106 __ai __attribute__((target("fp8fma,neon"))) float16x8_t vmlaltq_f16_mf8_fpm(float16x8_t __p0, mfloat8x16_t __p1, mfloat8x16_t __p2, fpm_t __p3) { 42107 float16x8_t __ret; 42108 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 42109 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 42110 
mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 42111 __ret = (float16x8_t) __builtin_neon_vmlaltq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3); 42112 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 42113 return __ret; 42114 } 42115 #endif 42116 42117 #ifdef __LITTLE_ENDIAN__ 42118 #define vmlaltq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42119 float16x8_t __ret; \ 42120 float16x8_t __s0 = __p0; \ 42121 mfloat8x16_t __s1 = __p1; \ 42122 mfloat8x8_t __s2 = __p2; \ 42123 fpm_t __s4 = __p4; \ 42124 __ret = (float16x8_t) __builtin_neon_vmlaltq_lane_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \ 42125 __ret; \ 42126 }) 42127 #else 42128 #define vmlaltq_lane_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42129 float16x8_t __ret; \ 42130 float16x8_t __s0 = __p0; \ 42131 mfloat8x16_t __s1 = __p1; \ 42132 mfloat8x8_t __s2 = __p2; \ 42133 fpm_t __s4 = __p4; \ 42134 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42135 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42136 mfloat8x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 42137 __ret = (float16x8_t) __builtin_neon_vmlaltq_lane_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \ 42138 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42139 __ret; \ 42140 }) 42141 #endif 42142 42143 #ifdef __LITTLE_ENDIAN__ 42144 #define vmlaltq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42145 float16x8_t __ret; \ 42146 float16x8_t __s0 = __p0; \ 42147 mfloat8x16_t __s1 = __p1; \ 42148 mfloat8x16_t __s2 = __p2; \ 42149 fpm_t __s4 = __p4; \ 42150 __ret = (float16x8_t) __builtin_neon_vmlaltq_laneq_f16_mf8_fpm((int8x16_t)__s0, __s1, __s2, __p3, __s4); \ 42151 __ret; \ 42152 }) 42153 
#else 42154 #define vmlaltq_laneq_f16_mf8_fpm(__p0, __p1, __p2, __p3, __p4) __extension__ ({ \ 42155 float16x8_t __ret; \ 42156 float16x8_t __s0 = __p0; \ 42157 mfloat8x16_t __s1 = __p1; \ 42158 mfloat8x16_t __s2 = __p2; \ 42159 fpm_t __s4 = __p4; \ 42160 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42161 mfloat8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42162 mfloat8x16_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42163 __ret = (float16x8_t) __builtin_neon_vmlaltq_laneq_f16_mf8_fpm((int8x16_t)__rev0, __rev1, __rev2, __p3, __s4); \ 42164 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42165 __ret; \ 42166 }) 42167 #endif 42168 42169 #ifdef __LITTLE_ENDIAN__ 42170 #define vluti2_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 42171 poly8x16_t __ret; \ 42172 poly8x8_t __s0 = __p0; \ 42173 uint8x8_t __s1 = __p1; \ 42174 __ret = (poly8x16_t) __builtin_neon_vluti2_lane_p8((int8x8_t)__s0, (int8x8_t)__s1, __p2, 36); \ 42175 __ret; \ 42176 }) 42177 #else 42178 #define vluti2_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 42179 poly8x16_t __ret; \ 42180 poly8x8_t __s0 = __p0; \ 42181 uint8x8_t __s1 = __p1; \ 42182 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42183 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42184 __ret = (poly8x16_t) __builtin_neon_vluti2_lane_p8((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 36); \ 42185 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42186 __ret; \ 42187 }) 42188 #endif 42189 42190 #ifdef __LITTLE_ENDIAN__ 42191 #define vluti2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 42192 poly8x16_t __ret; \ 42193 poly8x16_t __s0 = __p0; \ 42194 uint8x8_t __s1 = __p1; \ 42195 __ret = (poly8x16_t) 
__builtin_neon_vluti2q_lane_p8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 36); \ 42196 __ret; \ 42197 }) 42198 #else 42199 #define vluti2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 42200 poly8x16_t __ret; \ 42201 poly8x16_t __s0 = __p0; \ 42202 uint8x8_t __s1 = __p1; \ 42203 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42204 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42205 __ret = (poly8x16_t) __builtin_neon_vluti2q_lane_p8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 36); \ 42206 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42207 __ret; \ 42208 }) 42209 #endif 42210 42211 #ifdef __LITTLE_ENDIAN__ 42212 #define vluti2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 42213 uint8x16_t __ret; \ 42214 uint8x16_t __s0 = __p0; \ 42215 uint8x8_t __s1 = __p1; \ 42216 __ret = (uint8x16_t) __builtin_neon_vluti2q_lane_u8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 48); \ 42217 __ret; \ 42218 }) 42219 #else 42220 #define vluti2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 42221 uint8x16_t __ret; \ 42222 uint8x16_t __s0 = __p0; \ 42223 uint8x8_t __s1 = __p1; \ 42224 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42225 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42226 __ret = (uint8x16_t) __builtin_neon_vluti2q_lane_u8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 48); \ 42227 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42228 __ret; \ 42229 }) 42230 #endif 42231 42232 #ifdef __LITTLE_ENDIAN__ 42233 #define vluti2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 42234 int8x16_t __ret; \ 42235 int8x16_t __s0 = __p0; \ 42236 uint8x8_t __s1 = __p1; \ 42237 __ret = (int8x16_t) __builtin_neon_vluti2q_lane_s8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 
32); \ 42238 __ret; \ 42239 }) 42240 #else 42241 #define vluti2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 42242 int8x16_t __ret; \ 42243 int8x16_t __s0 = __p0; \ 42244 uint8x8_t __s1 = __p1; \ 42245 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42246 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42247 __ret = (int8x16_t) __builtin_neon_vluti2q_lane_s8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 32); \ 42248 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42249 __ret; \ 42250 }) 42251 #endif 42252 42253 #ifdef __LITTLE_ENDIAN__ 42254 #define vluti2_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 42255 uint8x16_t __ret; \ 42256 uint8x8_t __s0 = __p0; \ 42257 uint8x8_t __s1 = __p1; \ 42258 __ret = (uint8x16_t) __builtin_neon_vluti2_lane_u8((int8x8_t)__s0, (int8x8_t)__s1, __p2, 48); \ 42259 __ret; \ 42260 }) 42261 #else 42262 #define vluti2_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 42263 uint8x16_t __ret; \ 42264 uint8x8_t __s0 = __p0; \ 42265 uint8x8_t __s1 = __p1; \ 42266 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42267 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42268 __ret = (uint8x16_t) __builtin_neon_vluti2_lane_u8((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 48); \ 42269 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42270 __ret; \ 42271 }) 42272 #endif 42273 42274 #ifdef __LITTLE_ENDIAN__ 42275 #define vluti2_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 42276 int8x16_t __ret; \ 42277 int8x8_t __s0 = __p0; \ 42278 uint8x8_t __s1 = __p1; \ 42279 __ret = (int8x16_t) __builtin_neon_vluti2_lane_s8((int8x8_t)__s0, (int8x8_t)__s1, __p2, 32); \ 42280 __ret; \ 42281 }) 42282 #else 42283 #define vluti2_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 42284 
int8x16_t __ret; \ 42285 int8x8_t __s0 = __p0; \ 42286 uint8x8_t __s1 = __p1; \ 42287 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42288 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42289 __ret = (int8x16_t) __builtin_neon_vluti2_lane_s8((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 32); \ 42290 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42291 __ret; \ 42292 }) 42293 #endif 42294 42295 #ifdef __LITTLE_ENDIAN__ 42296 #define vluti2_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 42297 poly16x8_t __ret; \ 42298 poly16x4_t __s0 = __p0; \ 42299 uint8x8_t __s1 = __p1; \ 42300 __ret = (poly16x8_t) __builtin_neon_vluti2_lane_p16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 37); \ 42301 __ret; \ 42302 }) 42303 #else 42304 #define vluti2_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 42305 poly16x8_t __ret; \ 42306 poly16x4_t __s0 = __p0; \ 42307 uint8x8_t __s1 = __p1; \ 42308 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42309 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42310 __ret = (poly16x8_t) __builtin_neon_vluti2_lane_p16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 37); \ 42311 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42312 __ret; \ 42313 }) 42314 #endif 42315 42316 #ifdef __LITTLE_ENDIAN__ 42317 #define vluti2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 42318 poly16x8_t __ret; \ 42319 poly16x8_t __s0 = __p0; \ 42320 uint8x8_t __s1 = __p1; \ 42321 __ret = (poly16x8_t) __builtin_neon_vluti2q_lane_p16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 37); \ 42322 __ret; \ 42323 }) 42324 #else 42325 #define vluti2q_lane_p16(__p0, __p1, __p2) __extension__ ({ \ 42326 poly16x8_t __ret; \ 42327 poly16x8_t __s0 = __p0; \ 42328 uint8x8_t __s1 = __p1; \ 42329 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 
0); \ 42330 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42331 __ret = (poly16x8_t) __builtin_neon_vluti2q_lane_p16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 37); \ 42332 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42333 __ret; \ 42334 }) 42335 #endif 42336 42337 #ifdef __LITTLE_ENDIAN__ 42338 #define vluti2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 42339 uint16x8_t __ret; \ 42340 uint16x8_t __s0 = __p0; \ 42341 uint8x8_t __s1 = __p1; \ 42342 __ret = (uint16x8_t) __builtin_neon_vluti2q_lane_u16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 49); \ 42343 __ret; \ 42344 }) 42345 #else 42346 #define vluti2q_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 42347 uint16x8_t __ret; \ 42348 uint16x8_t __s0 = __p0; \ 42349 uint8x8_t __s1 = __p1; \ 42350 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42351 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42352 __ret = (uint16x8_t) __builtin_neon_vluti2q_lane_u16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 49); \ 42353 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42354 __ret; \ 42355 }) 42356 #endif 42357 42358 #ifdef __LITTLE_ENDIAN__ 42359 #define vluti2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 42360 float16x8_t __ret; \ 42361 float16x8_t __s0 = __p0; \ 42362 uint8x8_t __s1 = __p1; \ 42363 __ret = (float16x8_t) __builtin_neon_vluti2q_lane_f16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 40); \ 42364 __ret; \ 42365 }) 42366 #else 42367 #define vluti2q_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 42368 float16x8_t __ret; \ 42369 float16x8_t __s0 = __p0; \ 42370 uint8x8_t __s1 = __p1; \ 42371 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42372 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42373 __ret = (float16x8_t) 
__builtin_neon_vluti2q_lane_f16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 40); \ 42374 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42375 __ret; \ 42376 }) 42377 #endif 42378 42379 #ifdef __LITTLE_ENDIAN__ 42380 #define vluti2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 42381 int16x8_t __ret; \ 42382 int16x8_t __s0 = __p0; \ 42383 uint8x8_t __s1 = __p1; \ 42384 __ret = (int16x8_t) __builtin_neon_vluti2q_lane_s16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 33); \ 42385 __ret; \ 42386 }) 42387 #else 42388 #define vluti2q_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 42389 int16x8_t __ret; \ 42390 int16x8_t __s0 = __p0; \ 42391 uint8x8_t __s1 = __p1; \ 42392 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42393 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42394 __ret = (int16x8_t) __builtin_neon_vluti2q_lane_s16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 33); \ 42395 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42396 __ret; \ 42397 }) 42398 #endif 42399 42400 #ifdef __LITTLE_ENDIAN__ 42401 #define vluti2_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 42402 uint16x8_t __ret; \ 42403 uint16x4_t __s0 = __p0; \ 42404 uint8x8_t __s1 = __p1; \ 42405 __ret = (uint16x8_t) __builtin_neon_vluti2_lane_u16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 49); \ 42406 __ret; \ 42407 }) 42408 #else 42409 #define vluti2_lane_u16(__p0, __p1, __p2) __extension__ ({ \ 42410 uint16x8_t __ret; \ 42411 uint16x4_t __s0 = __p0; \ 42412 uint8x8_t __s1 = __p1; \ 42413 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42414 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42415 __ret = (uint16x8_t) __builtin_neon_vluti2_lane_u16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 49); \ 42416 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42417 __ret; \ 42418 }) 42419 #endif 42420 
42421 #ifdef __LITTLE_ENDIAN__ 42422 #define vluti2_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 42423 float16x8_t __ret; \ 42424 float16x4_t __s0 = __p0; \ 42425 uint8x8_t __s1 = __p1; \ 42426 __ret = (float16x8_t) __builtin_neon_vluti2_lane_f16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 40); \ 42427 __ret; \ 42428 }) 42429 #else 42430 #define vluti2_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 42431 float16x8_t __ret; \ 42432 float16x4_t __s0 = __p0; \ 42433 uint8x8_t __s1 = __p1; \ 42434 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42435 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42436 __ret = (float16x8_t) __builtin_neon_vluti2_lane_f16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 40); \ 42437 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42438 __ret; \ 42439 }) 42440 #endif 42441 42442 #ifdef __LITTLE_ENDIAN__ 42443 #define vluti2_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 42444 int16x8_t __ret; \ 42445 int16x4_t __s0 = __p0; \ 42446 uint8x8_t __s1 = __p1; \ 42447 __ret = (int16x8_t) __builtin_neon_vluti2_lane_s16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 33); \ 42448 __ret; \ 42449 }) 42450 #else 42451 #define vluti2_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 42452 int16x8_t __ret; \ 42453 int16x4_t __s0 = __p0; \ 42454 uint8x8_t __s1 = __p1; \ 42455 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42456 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42457 __ret = (int16x8_t) __builtin_neon_vluti2_lane_s16((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 33); \ 42458 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42459 __ret; \ 42460 }) 42461 #endif 42462 42463 #ifdef __LITTLE_ENDIAN__ 42464 #define vluti2_laneq_p8(__p0, __p1, __p2) __extension__ ({ \ 42465 poly8x16_t __ret; \ 42466 poly8x8_t __s0 = __p0; \ 42467 uint8x16_t __s1 = __p1; \ 42468 __ret = (poly8x16_t) 
__builtin_neon_vluti2_laneq_p8((int8x8_t)__s0, (int8x16_t)__s1, __p2, 36); \ 42469 __ret; \ 42470 }) 42471 #else 42472 #define vluti2_laneq_p8(__p0, __p1, __p2) __extension__ ({ \ 42473 poly8x16_t __ret; \ 42474 poly8x8_t __s0 = __p0; \ 42475 uint8x16_t __s1 = __p1; \ 42476 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42477 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42478 __ret = (poly8x16_t) __builtin_neon_vluti2_laneq_p8((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 36); \ 42479 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42480 __ret; \ 42481 }) 42482 #endif 42483 42484 #ifdef __LITTLE_ENDIAN__ 42485 #define vluti2q_laneq_p8(__p0, __p1, __p2) __extension__ ({ \ 42486 poly8x16_t __ret; \ 42487 poly8x16_t __s0 = __p0; \ 42488 uint8x16_t __s1 = __p1; \ 42489 __ret = (poly8x16_t) __builtin_neon_vluti2q_laneq_p8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \ 42490 __ret; \ 42491 }) 42492 #else 42493 #define vluti2q_laneq_p8(__p0, __p1, __p2) __extension__ ({ \ 42494 poly8x16_t __ret; \ 42495 poly8x16_t __s0 = __p0; \ 42496 uint8x16_t __s1 = __p1; \ 42497 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42498 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42499 __ret = (poly8x16_t) __builtin_neon_vluti2q_laneq_p8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \ 42500 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42501 __ret; \ 42502 }) 42503 #endif 42504 42505 #ifdef __LITTLE_ENDIAN__ 42506 #define vluti2q_laneq_u8(__p0, __p1, __p2) __extension__ ({ \ 42507 uint8x16_t __ret; \ 42508 uint8x16_t __s0 = __p0; \ 42509 uint8x16_t __s1 = __p1; \ 42510 __ret = (uint8x16_t) 
__builtin_neon_vluti2q_laneq_u8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \ 42511 __ret; \ 42512 }) 42513 #else 42514 #define vluti2q_laneq_u8(__p0, __p1, __p2) __extension__ ({ \ 42515 uint8x16_t __ret; \ 42516 uint8x16_t __s0 = __p0; \ 42517 uint8x16_t __s1 = __p1; \ 42518 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42519 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42520 __ret = (uint8x16_t) __builtin_neon_vluti2q_laneq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \ 42521 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42522 __ret; \ 42523 }) 42524 #endif 42525 42526 #ifdef __LITTLE_ENDIAN__ 42527 #define vluti2q_laneq_s8(__p0, __p1, __p2) __extension__ ({ \ 42528 int8x16_t __ret; \ 42529 int8x16_t __s0 = __p0; \ 42530 uint8x16_t __s1 = __p1; \ 42531 __ret = (int8x16_t) __builtin_neon_vluti2q_laneq_s8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \ 42532 __ret; \ 42533 }) 42534 #else 42535 #define vluti2q_laneq_s8(__p0, __p1, __p2) __extension__ ({ \ 42536 int8x16_t __ret; \ 42537 int8x16_t __s0 = __p0; \ 42538 uint8x16_t __s1 = __p1; \ 42539 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42540 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42541 __ret = (int8x16_t) __builtin_neon_vluti2q_laneq_s8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \ 42542 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42543 __ret; \ 42544 }) 42545 #endif 42546 42547 #ifdef __LITTLE_ENDIAN__ 42548 #define vluti2_laneq_u8(__p0, __p1, __p2) __extension__ ({ \ 42549 uint8x16_t __ret; \ 42550 uint8x8_t __s0 = __p0; \ 42551 uint8x16_t __s1 = __p1; \ 42552 __ret = 
(uint8x16_t) __builtin_neon_vluti2_laneq_u8((int8x8_t)__s0, (int8x16_t)__s1, __p2, 48); \ 42553 __ret; \ 42554 }) 42555 #else 42556 #define vluti2_laneq_u8(__p0, __p1, __p2) __extension__ ({ \ 42557 uint8x16_t __ret; \ 42558 uint8x8_t __s0 = __p0; \ 42559 uint8x16_t __s1 = __p1; \ 42560 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42561 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42562 __ret = (uint8x16_t) __builtin_neon_vluti2_laneq_u8((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 48); \ 42563 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42564 __ret; \ 42565 }) 42566 #endif 42567 42568 #ifdef __LITTLE_ENDIAN__ 42569 #define vluti2_laneq_s8(__p0, __p1, __p2) __extension__ ({ \ 42570 int8x16_t __ret; \ 42571 int8x8_t __s0 = __p0; \ 42572 uint8x16_t __s1 = __p1; \ 42573 __ret = (int8x16_t) __builtin_neon_vluti2_laneq_s8((int8x8_t)__s0, (int8x16_t)__s1, __p2, 32); \ 42574 __ret; \ 42575 }) 42576 #else 42577 #define vluti2_laneq_s8(__p0, __p1, __p2) __extension__ ({ \ 42578 int8x16_t __ret; \ 42579 int8x8_t __s0 = __p0; \ 42580 uint8x16_t __s1 = __p1; \ 42581 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42582 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42583 __ret = (int8x16_t) __builtin_neon_vluti2_laneq_s8((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 32); \ 42584 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42585 __ret; \ 42586 }) 42587 #endif 42588 42589 #ifdef __LITTLE_ENDIAN__ 42590 #define vluti2_laneq_p16(__p0, __p1, __p2) __extension__ ({ \ 42591 poly16x8_t __ret; \ 42592 poly16x4_t __s0 = __p0; \ 42593 uint8x16_t __s1 = __p1; \ 42594 __ret = (poly16x8_t) __builtin_neon_vluti2_laneq_p16((int8x8_t)__s0, 
(int8x16_t)__s1, __p2, 37); \ 42595 __ret; \ 42596 }) 42597 #else 42598 #define vluti2_laneq_p16(__p0, __p1, __p2) __extension__ ({ \ 42599 poly16x8_t __ret; \ 42600 poly16x4_t __s0 = __p0; \ 42601 uint8x16_t __s1 = __p1; \ 42602 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42603 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42604 __ret = (poly16x8_t) __builtin_neon_vluti2_laneq_p16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 37); \ 42605 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42606 __ret; \ 42607 }) 42608 #endif 42609 42610 #ifdef __LITTLE_ENDIAN__ 42611 #define vluti2q_laneq_p16(__p0, __p1, __p2) __extension__ ({ \ 42612 poly16x8_t __ret; \ 42613 poly16x8_t __s0 = __p0; \ 42614 uint8x16_t __s1 = __p1; \ 42615 __ret = (poly16x8_t) __builtin_neon_vluti2q_laneq_p16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 37); \ 42616 __ret; \ 42617 }) 42618 #else 42619 #define vluti2q_laneq_p16(__p0, __p1, __p2) __extension__ ({ \ 42620 poly16x8_t __ret; \ 42621 poly16x8_t __s0 = __p0; \ 42622 uint8x16_t __s1 = __p1; \ 42623 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42624 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42625 __ret = (poly16x8_t) __builtin_neon_vluti2q_laneq_p16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 37); \ 42626 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42627 __ret; \ 42628 }) 42629 #endif 42630 42631 #ifdef __LITTLE_ENDIAN__ 42632 #define vluti2q_laneq_u16(__p0, __p1, __p2) __extension__ ({ \ 42633 uint16x8_t __ret; \ 42634 uint16x8_t __s0 = __p0; \ 42635 uint8x16_t __s1 = __p1; \ 42636 __ret = (uint16x8_t) __builtin_neon_vluti2q_laneq_u16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 49); \ 42637 __ret; \ 42638 }) 42639 #else 42640 #define vluti2q_laneq_u16(__p0, __p1, __p2) 
__extension__ ({ \ 42641 uint16x8_t __ret; \ 42642 uint16x8_t __s0 = __p0; \ 42643 uint8x16_t __s1 = __p1; \ 42644 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42645 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42646 __ret = (uint16x8_t) __builtin_neon_vluti2q_laneq_u16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 49); \ 42647 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42648 __ret; \ 42649 }) 42650 #endif 42651 42652 #ifdef __LITTLE_ENDIAN__ 42653 #define vluti2q_laneq_f16(__p0, __p1, __p2) __extension__ ({ \ 42654 float16x8_t __ret; \ 42655 float16x8_t __s0 = __p0; \ 42656 uint8x16_t __s1 = __p1; \ 42657 __ret = (float16x8_t) __builtin_neon_vluti2q_laneq_f16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 40); \ 42658 __ret; \ 42659 }) 42660 #else 42661 #define vluti2q_laneq_f16(__p0, __p1, __p2) __extension__ ({ \ 42662 float16x8_t __ret; \ 42663 float16x8_t __s0 = __p0; \ 42664 uint8x16_t __s1 = __p1; \ 42665 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42666 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42667 __ret = (float16x8_t) __builtin_neon_vluti2q_laneq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 40); \ 42668 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42669 __ret; \ 42670 }) 42671 #endif 42672 42673 #ifdef __LITTLE_ENDIAN__ 42674 #define vluti2q_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 42675 int16x8_t __ret; \ 42676 int16x8_t __s0 = __p0; \ 42677 uint8x16_t __s1 = __p1; \ 42678 __ret = (int16x8_t) __builtin_neon_vluti2q_laneq_s16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \ 42679 __ret; \ 42680 }) 42681 #else 42682 #define vluti2q_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 42683 int16x8_t __ret; \ 42684 int16x8_t __s0 = __p0; \ 42685 uint8x16_t __s1 
= __p1; \ 42686 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 42687 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42688 __ret = (int16x8_t) __builtin_neon_vluti2q_laneq_s16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 42689 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42690 __ret; \ 42691 }) 42692 #endif 42693 42694 #ifdef __LITTLE_ENDIAN__ 42695 #define vluti2_laneq_u16(__p0, __p1, __p2) __extension__ ({ \ 42696 uint16x8_t __ret; \ 42697 uint16x4_t __s0 = __p0; \ 42698 uint8x16_t __s1 = __p1; \ 42699 __ret = (uint16x8_t) __builtin_neon_vluti2_laneq_u16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 49); \ 42700 __ret; \ 42701 }) 42702 #else 42703 #define vluti2_laneq_u16(__p0, __p1, __p2) __extension__ ({ \ 42704 uint16x8_t __ret; \ 42705 uint16x4_t __s0 = __p0; \ 42706 uint8x16_t __s1 = __p1; \ 42707 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42708 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42709 __ret = (uint16x8_t) __builtin_neon_vluti2_laneq_u16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 49); \ 42710 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42711 __ret; \ 42712 }) 42713 #endif 42714 42715 #ifdef __LITTLE_ENDIAN__ 42716 #define vluti2_laneq_f16(__p0, __p1, __p2) __extension__ ({ \ 42717 float16x8_t __ret; \ 42718 float16x4_t __s0 = __p0; \ 42719 uint8x16_t __s1 = __p1; \ 42720 __ret = (float16x8_t) __builtin_neon_vluti2_laneq_f16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 40); \ 42721 __ret; \ 42722 }) 42723 #else 42724 #define vluti2_laneq_f16(__p0, __p1, __p2) __extension__ ({ \ 42725 float16x8_t __ret; \ 42726 float16x4_t __s0 = __p0; \ 42727 uint8x16_t __s1 = __p1; \ 42728 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42729 uint8x16_t __rev1; 
__rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42730 __ret = (float16x8_t) __builtin_neon_vluti2_laneq_f16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 40); \ 42731 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42732 __ret; \ 42733 }) 42734 #endif 42735 42736 #ifdef __LITTLE_ENDIAN__ 42737 #define vluti2_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 42738 int16x8_t __ret; \ 42739 int16x4_t __s0 = __p0; \ 42740 uint8x16_t __s1 = __p1; \ 42741 __ret = (int16x8_t) __builtin_neon_vluti2_laneq_s16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 33); \ 42742 __ret; \ 42743 }) 42744 #else 42745 #define vluti2_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 42746 int16x8_t __ret; \ 42747 int16x4_t __s0 = __p0; \ 42748 uint8x16_t __s1 = __p1; \ 42749 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 42750 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42751 __ret = (int16x8_t) __builtin_neon_vluti2_laneq_s16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 42752 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42753 __ret; \ 42754 }) 42755 #endif 42756 42757 #ifdef __LITTLE_ENDIAN__ 42758 #define vluti4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 42759 poly8x16_t __ret; \ 42760 poly8x16_t __s0 = __p0; \ 42761 uint8x8_t __s1 = __p1; \ 42762 __ret = (poly8x16_t) __builtin_neon_vluti4q_lane_p8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 36); \ 42763 __ret; \ 42764 }) 42765 #else 42766 #define vluti4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 42767 poly8x16_t __ret; \ 42768 poly8x16_t __s0 = __p0; \ 42769 uint8x8_t __s1 = __p1; \ 42770 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42771 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42772 __ret = (poly8x16_t) 
__builtin_neon_vluti4q_lane_p8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 36); \ 42773 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42774 __ret; \ 42775 }) 42776 #endif 42777 42778 #ifdef __LITTLE_ENDIAN__ 42779 #define vluti4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 42780 uint8x16_t __ret; \ 42781 uint8x16_t __s0 = __p0; \ 42782 uint8x8_t __s1 = __p1; \ 42783 __ret = (uint8x16_t) __builtin_neon_vluti4q_lane_u8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 48); \ 42784 __ret; \ 42785 }) 42786 #else 42787 #define vluti4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 42788 uint8x16_t __ret; \ 42789 uint8x16_t __s0 = __p0; \ 42790 uint8x8_t __s1 = __p1; \ 42791 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42792 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42793 __ret = (uint8x16_t) __builtin_neon_vluti4q_lane_u8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 48); \ 42794 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42795 __ret; \ 42796 }) 42797 #endif 42798 42799 #ifdef __LITTLE_ENDIAN__ 42800 #define vluti4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 42801 int8x16_t __ret; \ 42802 int8x16_t __s0 = __p0; \ 42803 uint8x8_t __s1 = __p1; \ 42804 __ret = (int8x16_t) __builtin_neon_vluti4q_lane_s8((int8x16_t)__s0, (int8x8_t)__s1, __p2, 32); \ 42805 __ret; \ 42806 }) 42807 #else 42808 #define vluti4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 42809 int8x16_t __ret; \ 42810 int8x16_t __s0 = __p0; \ 42811 uint8x8_t __s1 = __p1; \ 42812 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42813 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42814 __ret = (int8x16_t) __builtin_neon_vluti4q_lane_s8((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 
32); \ 42815 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42816 __ret; \ 42817 }) 42818 #endif 42819 42820 #ifdef __LITTLE_ENDIAN__ 42821 #define vluti4q_lane_p16_x2(__p0, __p1, __p2) __extension__ ({ \ 42822 poly16x8_t __ret; \ 42823 poly16x8x2_t __s0 = __p0; \ 42824 uint8x8_t __s1 = __p1; \ 42825 __ret = (poly16x8_t) __builtin_neon_vluti4q_lane_p16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 37); \ 42826 __ret; \ 42827 }) 42828 #else 42829 #define vluti4q_lane_p16_x2(__p0, __p1, __p2) __extension__ ({ \ 42830 poly16x8_t __ret; \ 42831 poly16x8x2_t __s0 = __p0; \ 42832 uint8x8_t __s1 = __p1; \ 42833 poly16x8x2_t __rev0; \ 42834 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 42835 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 42836 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42837 __ret = (poly16x8_t) __builtin_neon_vluti4q_lane_p16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 37); \ 42838 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42839 __ret; \ 42840 }) 42841 #endif 42842 42843 #ifdef __LITTLE_ENDIAN__ 42844 #define vluti4q_lane_u16_x2(__p0, __p1, __p2) __extension__ ({ \ 42845 uint16x8_t __ret; \ 42846 uint16x8x2_t __s0 = __p0; \ 42847 uint8x8_t __s1 = __p1; \ 42848 __ret = (uint16x8_t) __builtin_neon_vluti4q_lane_u16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 49); \ 42849 __ret; \ 42850 }) 42851 #else 42852 #define vluti4q_lane_u16_x2(__p0, __p1, __p2) __extension__ ({ \ 42853 uint16x8_t __ret; \ 42854 uint16x8x2_t __s0 = __p0; \ 42855 uint8x8_t __s1 = __p1; \ 42856 uint16x8x2_t __rev0; \ 42857 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 42858 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], 
__s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 42859 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42860 __ret = (uint16x8_t) __builtin_neon_vluti4q_lane_u16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 49); \ 42861 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42862 __ret; \ 42863 }) 42864 #endif 42865 42866 #ifdef __LITTLE_ENDIAN__ 42867 #define vluti4q_lane_f16_x2(__p0, __p1, __p2) __extension__ ({ \ 42868 float16x8_t __ret; \ 42869 float16x8x2_t __s0 = __p0; \ 42870 uint8x8_t __s1 = __p1; \ 42871 __ret = (float16x8_t) __builtin_neon_vluti4q_lane_f16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 40); \ 42872 __ret; \ 42873 }) 42874 #else 42875 #define vluti4q_lane_f16_x2(__p0, __p1, __p2) __extension__ ({ \ 42876 float16x8_t __ret; \ 42877 float16x8x2_t __s0 = __p0; \ 42878 uint8x8_t __s1 = __p1; \ 42879 float16x8x2_t __rev0; \ 42880 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 42881 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 42882 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42883 __ret = (float16x8_t) __builtin_neon_vluti4q_lane_f16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 40); \ 42884 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42885 __ret; \ 42886 }) 42887 #endif 42888 42889 #ifdef __LITTLE_ENDIAN__ 42890 #define vluti4q_lane_s16_x2(__p0, __p1, __p2) __extension__ ({ \ 42891 int16x8_t __ret; \ 42892 int16x8x2_t __s0 = __p0; \ 42893 uint8x8_t __s1 = __p1; \ 42894 __ret = (int16x8_t) __builtin_neon_vluti4q_lane_s16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 33); \ 42895 __ret; \ 42896 }) 42897 #else 42898 #define vluti4q_lane_s16_x2(__p0, __p1, __p2) __extension__ ({ \ 42899 int16x8_t __ret; \ 42900 
int16x8x2_t __s0 = __p0; \ 42901 uint8x8_t __s1 = __p1; \ 42902 int16x8x2_t __rev0; \ 42903 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 42904 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 42905 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 42906 __ret = (int16x8_t) __builtin_neon_vluti4q_lane_s16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 33); \ 42907 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42908 __ret; \ 42909 }) 42910 #endif 42911 42912 #ifdef __LITTLE_ENDIAN__ 42913 #define vluti4q_laneq_p8(__p0, __p1, __p2) __extension__ ({ \ 42914 poly8x16_t __ret; \ 42915 poly8x16_t __s0 = __p0; \ 42916 uint8x16_t __s1 = __p1; \ 42917 __ret = (poly8x16_t) __builtin_neon_vluti4q_laneq_p8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 36); \ 42918 __ret; \ 42919 }) 42920 #else 42921 #define vluti4q_laneq_p8(__p0, __p1, __p2) __extension__ ({ \ 42922 poly8x16_t __ret; \ 42923 poly8x16_t __s0 = __p0; \ 42924 uint8x16_t __s1 = __p1; \ 42925 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42926 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42927 __ret = (poly8x16_t) __builtin_neon_vluti4q_laneq_p8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 36); \ 42928 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42929 __ret; \ 42930 }) 42931 #endif 42932 42933 #ifdef __LITTLE_ENDIAN__ 42934 #define vluti4q_laneq_u8(__p0, __p1, __p2) __extension__ ({ \ 42935 uint8x16_t __ret; \ 42936 uint8x16_t __s0 = __p0; \ 42937 uint8x16_t __s1 = __p1; \ 42938 __ret = (uint8x16_t) __builtin_neon_vluti4q_laneq_u8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 48); \ 42939 __ret; \ 42940 }) 42941 #else 42942 #define 
vluti4q_laneq_u8(__p0, __p1, __p2) __extension__ ({ \ 42943 uint8x16_t __ret; \ 42944 uint8x16_t __s0 = __p0; \ 42945 uint8x16_t __s1 = __p1; \ 42946 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42947 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42948 __ret = (uint8x16_t) __builtin_neon_vluti4q_laneq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 48); \ 42949 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42950 __ret; \ 42951 }) 42952 #endif 42953 42954 #ifdef __LITTLE_ENDIAN__ 42955 #define vluti4q_laneq_s8(__p0, __p1, __p2) __extension__ ({ \ 42956 int8x16_t __ret; \ 42957 int8x16_t __s0 = __p0; \ 42958 uint8x16_t __s1 = __p1; \ 42959 __ret = (int8x16_t) __builtin_neon_vluti4q_laneq_s8((int8x16_t)__s0, (int8x16_t)__s1, __p2, 32); \ 42960 __ret; \ 42961 }) 42962 #else 42963 #define vluti4q_laneq_s8(__p0, __p1, __p2) __extension__ ({ \ 42964 int8x16_t __ret; \ 42965 int8x16_t __s0 = __p0; \ 42966 uint8x16_t __s1 = __p1; \ 42967 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42968 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42969 __ret = (int8x16_t) __builtin_neon_vluti4q_laneq_s8((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 32); \ 42970 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42971 __ret; \ 42972 }) 42973 #endif 42974 42975 #ifdef __LITTLE_ENDIAN__ 42976 #define vluti4q_laneq_p16_x2(__p0, __p1, __p2) __extension__ ({ \ 42977 poly16x8_t __ret; \ 42978 poly16x8x2_t __s0 = __p0; \ 42979 uint8x16_t __s1 = __p1; \ 42980 __ret = (poly16x8_t) __builtin_neon_vluti4q_laneq_p16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 37); \ 42981 
__ret; \ 42982 }) 42983 #else 42984 #define vluti4q_laneq_p16_x2(__p0, __p1, __p2) __extension__ ({ \ 42985 poly16x8_t __ret; \ 42986 poly16x8x2_t __s0 = __p0; \ 42987 uint8x16_t __s1 = __p1; \ 42988 poly16x8x2_t __rev0; \ 42989 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 42990 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 42991 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 42992 __ret = (poly16x8_t) __builtin_neon_vluti4q_laneq_p16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 37); \ 42993 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 42994 __ret; \ 42995 }) 42996 #endif 42997 42998 #ifdef __LITTLE_ENDIAN__ 42999 #define vluti4q_laneq_u16_x2(__p0, __p1, __p2) __extension__ ({ \ 43000 uint16x8_t __ret; \ 43001 uint16x8x2_t __s0 = __p0; \ 43002 uint8x16_t __s1 = __p1; \ 43003 __ret = (uint16x8_t) __builtin_neon_vluti4q_laneq_u16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 49); \ 43004 __ret; \ 43005 }) 43006 #else 43007 #define vluti4q_laneq_u16_x2(__p0, __p1, __p2) __extension__ ({ \ 43008 uint16x8_t __ret; \ 43009 uint16x8x2_t __s0 = __p0; \ 43010 uint8x16_t __s1 = __p1; \ 43011 uint16x8x2_t __rev0; \ 43012 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 43013 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 43014 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43015 __ret = (uint16x8_t) __builtin_neon_vluti4q_laneq_u16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 49); \ 43016 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 43017 __ret; \ 43018 }) 43019 #endif 43020 43021 #ifdef 
__LITTLE_ENDIAN__ 43022 #define vluti4q_laneq_f16_x2(__p0, __p1, __p2) __extension__ ({ \ 43023 float16x8_t __ret; \ 43024 float16x8x2_t __s0 = __p0; \ 43025 uint8x16_t __s1 = __p1; \ 43026 __ret = (float16x8_t) __builtin_neon_vluti4q_laneq_f16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 40); \ 43027 __ret; \ 43028 }) 43029 #else 43030 #define vluti4q_laneq_f16_x2(__p0, __p1, __p2) __extension__ ({ \ 43031 float16x8_t __ret; \ 43032 float16x8x2_t __s0 = __p0; \ 43033 uint8x16_t __s1 = __p1; \ 43034 float16x8x2_t __rev0; \ 43035 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 43036 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 43037 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43038 __ret = (float16x8_t) __builtin_neon_vluti4q_laneq_f16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 40); \ 43039 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 43040 __ret; \ 43041 }) 43042 #endif 43043 43044 #ifdef __LITTLE_ENDIAN__ 43045 #define vluti4q_laneq_s16_x2(__p0, __p1, __p2) __extension__ ({ \ 43046 int16x8_t __ret; \ 43047 int16x8x2_t __s0 = __p0; \ 43048 uint8x16_t __s1 = __p1; \ 43049 __ret = (int16x8_t) __builtin_neon_vluti4q_laneq_s16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 33); \ 43050 __ret; \ 43051 }) 43052 #else 43053 #define vluti4q_laneq_s16_x2(__p0, __p1, __p2) __extension__ ({ \ 43054 int16x8_t __ret; \ 43055 int16x8x2_t __s0 = __p0; \ 43056 uint8x16_t __s1 = __p1; \ 43057 int16x8x2_t __rev0; \ 43058 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 43059 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 43060 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 
10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43061 __ret = (int16x8_t) __builtin_neon_vluti4q_laneq_s16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 33); \ 43062 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 43063 __ret; \ 43064 }) 43065 #endif 43066 43067 #ifdef __LITTLE_ENDIAN__ 43068 #define vluti2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 43069 bfloat16x8_t __ret; \ 43070 bfloat16x8_t __s0 = __p0; \ 43071 uint8x8_t __s1 = __p1; \ 43072 __ret = (bfloat16x8_t) __builtin_neon_vluti2q_lane_bf16((int8x16_t)__s0, (int8x8_t)__s1, __p2, 43); \ 43073 __ret; \ 43074 }) 43075 #else 43076 #define vluti2q_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 43077 bfloat16x8_t __ret; \ 43078 bfloat16x8_t __s0 = __p0; \ 43079 uint8x8_t __s1 = __p1; \ 43080 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 43081 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 43082 __ret = (bfloat16x8_t) __builtin_neon_vluti2q_lane_bf16((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 43); \ 43083 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 43084 __ret; \ 43085 }) 43086 #endif 43087 43088 #ifdef __LITTLE_ENDIAN__ 43089 #define vluti2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 43090 bfloat16x8_t __ret; \ 43091 bfloat16x4_t __s0 = __p0; \ 43092 uint8x8_t __s1 = __p1; \ 43093 __ret = (bfloat16x8_t) __builtin_neon_vluti2_lane_bf16((int8x8_t)__s0, (int8x8_t)__s1, __p2, 43); \ 43094 __ret; \ 43095 }) 43096 #else 43097 #define vluti2_lane_bf16(__p0, __p1, __p2) __extension__ ({ \ 43098 bfloat16x8_t __ret; \ 43099 bfloat16x4_t __s0 = __p0; \ 43100 uint8x8_t __s1 = __p1; \ 43101 bfloat16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 43102 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 43103 __ret = (bfloat16x8_t) __builtin_neon_vluti2_lane_bf16((int8x8_t)__rev0, 
(int8x8_t)__rev1, __p2, 43); \ 43104 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 43105 __ret; \ 43106 }) 43107 #endif 43108 43109 #ifdef __LITTLE_ENDIAN__ 43110 #define vluti2q_laneq_bf16(__p0, __p1, __p2) __extension__ ({ \ 43111 bfloat16x8_t __ret; \ 43112 bfloat16x8_t __s0 = __p0; \ 43113 uint8x16_t __s1 = __p1; \ 43114 __ret = (bfloat16x8_t) __builtin_neon_vluti2q_laneq_bf16((int8x16_t)__s0, (int8x16_t)__s1, __p2, 43); \ 43115 __ret; \ 43116 }) 43117 #else 43118 #define vluti2q_laneq_bf16(__p0, __p1, __p2) __extension__ ({ \ 43119 bfloat16x8_t __ret; \ 43120 bfloat16x8_t __s0 = __p0; \ 43121 uint8x16_t __s1 = __p1; \ 43122 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 43123 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43124 __ret = (bfloat16x8_t) __builtin_neon_vluti2q_laneq_bf16((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 43); \ 43125 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 43126 __ret; \ 43127 }) 43128 #endif 43129 43130 #ifdef __LITTLE_ENDIAN__ 43131 #define vluti2_laneq_bf16(__p0, __p1, __p2) __extension__ ({ \ 43132 bfloat16x8_t __ret; \ 43133 bfloat16x4_t __s0 = __p0; \ 43134 uint8x16_t __s1 = __p1; \ 43135 __ret = (bfloat16x8_t) __builtin_neon_vluti2_laneq_bf16((int8x8_t)__s0, (int8x16_t)__s1, __p2, 43); \ 43136 __ret; \ 43137 }) 43138 #else 43139 #define vluti2_laneq_bf16(__p0, __p1, __p2) __extension__ ({ \ 43140 bfloat16x8_t __ret; \ 43141 bfloat16x4_t __s0 = __p0; \ 43142 uint8x16_t __s1 = __p1; \ 43143 bfloat16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 43144 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43145 __ret = (bfloat16x8_t) __builtin_neon_vluti2_laneq_bf16((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 43); \ 43146 __ret = __builtin_shufflevector(__ret, __ret, 
7, 6, 5, 4, 3, 2, 1, 0); \ 43147 __ret; \ 43148 }) 43149 #endif 43150 43151 #ifdef __LITTLE_ENDIAN__ 43152 #define vluti4q_lane_bf16_x2(__p0, __p1, __p2) __extension__ ({ \ 43153 bfloat16x8_t __ret; \ 43154 bfloat16x8x2_t __s0 = __p0; \ 43155 uint8x8_t __s1 = __p1; \ 43156 __ret = (bfloat16x8_t) __builtin_neon_vluti4q_lane_bf16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x8_t)__s1, __p2, 43); \ 43157 __ret; \ 43158 }) 43159 #else 43160 #define vluti4q_lane_bf16_x2(__p0, __p1, __p2) __extension__ ({ \ 43161 bfloat16x8_t __ret; \ 43162 bfloat16x8x2_t __s0 = __p0; \ 43163 uint8x8_t __s1 = __p1; \ 43164 bfloat16x8x2_t __rev0; \ 43165 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 43166 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 43167 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 43168 __ret = (bfloat16x8_t) __builtin_neon_vluti4q_lane_bf16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, __p2, 43); \ 43169 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 43170 __ret; \ 43171 }) 43172 #endif 43173 43174 #ifdef __LITTLE_ENDIAN__ 43175 #define vluti4q_laneq_bf16_x2(__p0, __p1, __p2) __extension__ ({ \ 43176 bfloat16x8_t __ret; \ 43177 bfloat16x8x2_t __s0 = __p0; \ 43178 uint8x16_t __s1 = __p1; \ 43179 __ret = (bfloat16x8_t) __builtin_neon_vluti4q_laneq_bf16_x2((int8x16_t)__s0.val[0], (int8x16_t)__s0.val[1], (int8x16_t)__s1, __p2, 43); \ 43180 __ret; \ 43181 }) 43182 #else 43183 #define vluti4q_laneq_bf16_x2(__p0, __p1, __p2) __extension__ ({ \ 43184 bfloat16x8_t __ret; \ 43185 bfloat16x8x2_t __s0 = __p0; \ 43186 uint8x16_t __s1 = __p1; \ 43187 bfloat16x8x2_t __rev0; \ 43188 __rev0.val[0] = __builtin_shufflevector(__s0.val[0], __s0.val[0], 7, 6, 5, 4, 3, 2, 1, 0); \ 43189 __rev0.val[1] = __builtin_shufflevector(__s0.val[1], __s0.val[1], 7, 6, 5, 4, 3, 2, 1, 0); \ 43190 
uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43191 __ret = (bfloat16x8_t) __builtin_neon_vluti4q_laneq_bf16_x2((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, __p2, 43); \ 43192 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 43193 __ret; \ 43194 }) 43195 #endif 43196 43197 #ifdef __LITTLE_ENDIAN__ 43198 __ai __attribute__((target("neon,faminmax"))) float64x2_t vamaxq_f64(float64x2_t __p0, float64x2_t __p1) { 43199 float64x2_t __ret; 43200 __ret = (float64x2_t) __builtin_neon_vamaxq_f64((int8x16_t)__p0, (int8x16_t)__p1, 42); 43201 return __ret; 43202 } 43203 #else 43204 __ai __attribute__((target("neon,faminmax"))) float64x2_t vamaxq_f64(float64x2_t __p0, float64x2_t __p1) { 43205 float64x2_t __ret; 43206 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 43207 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 43208 __ret = (float64x2_t) __builtin_neon_vamaxq_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 43209 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 43210 return __ret; 43211 } 43212 #endif 43213 43214 #ifdef __LITTLE_ENDIAN__ 43215 __ai __attribute__((target("neon,faminmax"))) float32x4_t vamaxq_f32(float32x4_t __p0, float32x4_t __p1) { 43216 float32x4_t __ret; 43217 __ret = (float32x4_t) __builtin_neon_vamaxq_f32((int8x16_t)__p0, (int8x16_t)__p1, 41); 43218 return __ret; 43219 } 43220 #else 43221 __ai __attribute__((target("neon,faminmax"))) float32x4_t vamaxq_f32(float32x4_t __p0, float32x4_t __p1) { 43222 float32x4_t __ret; 43223 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43224 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 43225 __ret = (float32x4_t) __builtin_neon_vamaxq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 43226 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 43227 return __ret; 43228 } 43229 
#endif 43230 43231 #ifdef __LITTLE_ENDIAN__ 43232 __ai __attribute__((target("neon,faminmax"))) float16x8_t vamaxq_f16(float16x8_t __p0, float16x8_t __p1) { 43233 float16x8_t __ret; 43234 __ret = (float16x8_t) __builtin_neon_vamaxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 43235 return __ret; 43236 } 43237 #else 43238 __ai __attribute__((target("neon,faminmax"))) float16x8_t vamaxq_f16(float16x8_t __p0, float16x8_t __p1) { 43239 float16x8_t __ret; 43240 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 43241 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 43242 __ret = (float16x8_t) __builtin_neon_vamaxq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 43243 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 43244 return __ret; 43245 } 43246 #endif 43247 43248 #ifdef __LITTLE_ENDIAN__ 43249 __ai __attribute__((target("neon,faminmax"))) float32x2_t vamax_f32(float32x2_t __p0, float32x2_t __p1) { 43250 float32x2_t __ret; 43251 __ret = (float32x2_t) __builtin_neon_vamax_f32((int8x8_t)__p0, (int8x8_t)__p1, 9); 43252 return __ret; 43253 } 43254 #else 43255 __ai __attribute__((target("neon,faminmax"))) float32x2_t vamax_f32(float32x2_t __p0, float32x2_t __p1) { 43256 float32x2_t __ret; 43257 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 43258 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 43259 __ret = (float32x2_t) __builtin_neon_vamax_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 43260 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 43261 return __ret; 43262 } 43263 #endif 43264 43265 #ifdef __LITTLE_ENDIAN__ 43266 __ai __attribute__((target("neon,faminmax"))) float16x4_t vamax_f16(float16x4_t __p0, float16x4_t __p1) { 43267 float16x4_t __ret; 43268 __ret = (float16x4_t) __builtin_neon_vamax_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 43269 return __ret; 43270 } 43271 #else 43272 __ai 
__attribute__((target("neon,faminmax"))) float16x4_t vamax_f16(float16x4_t __p0, float16x4_t __p1) { 43273 float16x4_t __ret; 43274 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43275 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 43276 __ret = (float16x4_t) __builtin_neon_vamax_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 43277 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 43278 return __ret; 43279 } 43280 #endif 43281 43282 #ifdef __LITTLE_ENDIAN__ 43283 __ai __attribute__((target("neon,faminmax"))) float64x2_t vaminq_f64(float64x2_t __p0, float64x2_t __p1) { 43284 float64x2_t __ret; 43285 __ret = (float64x2_t) __builtin_neon_vaminq_f64((int8x16_t)__p0, (int8x16_t)__p1, 42); 43286 return __ret; 43287 } 43288 #else 43289 __ai __attribute__((target("neon,faminmax"))) float64x2_t vaminq_f64(float64x2_t __p0, float64x2_t __p1) { 43290 float64x2_t __ret; 43291 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 43292 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 43293 __ret = (float64x2_t) __builtin_neon_vaminq_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 43294 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 43295 return __ret; 43296 } 43297 #endif 43298 43299 #ifdef __LITTLE_ENDIAN__ 43300 __ai __attribute__((target("neon,faminmax"))) float32x4_t vaminq_f32(float32x4_t __p0, float32x4_t __p1) { 43301 float32x4_t __ret; 43302 __ret = (float32x4_t) __builtin_neon_vaminq_f32((int8x16_t)__p0, (int8x16_t)__p1, 41); 43303 return __ret; 43304 } 43305 #else 43306 __ai __attribute__((target("neon,faminmax"))) float32x4_t vaminq_f32(float32x4_t __p0, float32x4_t __p1) { 43307 float32x4_t __ret; 43308 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43309 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 43310 __ret = (float32x4_t) __builtin_neon_vaminq_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 
41); 43311 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 43312 return __ret; 43313 } 43314 #endif 43315 43316 #ifdef __LITTLE_ENDIAN__ 43317 __ai __attribute__((target("neon,faminmax"))) float16x8_t vaminq_f16(float16x8_t __p0, float16x8_t __p1) { 43318 float16x8_t __ret; 43319 __ret = (float16x8_t) __builtin_neon_vaminq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 43320 return __ret; 43321 } 43322 #else 43323 __ai __attribute__((target("neon,faminmax"))) float16x8_t vaminq_f16(float16x8_t __p0, float16x8_t __p1) { 43324 float16x8_t __ret; 43325 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 43326 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 43327 __ret = (float16x8_t) __builtin_neon_vaminq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 43328 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 43329 return __ret; 43330 } 43331 #endif 43332 43333 #ifdef __LITTLE_ENDIAN__ 43334 __ai __attribute__((target("neon,faminmax"))) float32x2_t vamin_f32(float32x2_t __p0, float32x2_t __p1) { 43335 float32x2_t __ret; 43336 __ret = (float32x2_t) __builtin_neon_vamin_f32((int8x8_t)__p0, (int8x8_t)__p1, 9); 43337 return __ret; 43338 } 43339 #else 43340 __ai __attribute__((target("neon,faminmax"))) float32x2_t vamin_f32(float32x2_t __p0, float32x2_t __p1) { 43341 float32x2_t __ret; 43342 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 43343 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 43344 __ret = (float32x2_t) __builtin_neon_vamin_f32((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 43345 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 43346 return __ret; 43347 } 43348 #endif 43349 43350 #ifdef __LITTLE_ENDIAN__ 43351 __ai __attribute__((target("neon,faminmax"))) float16x4_t vamin_f16(float16x4_t __p0, float16x4_t __p1) { 43352 float16x4_t __ret; 43353 __ret = (float16x4_t) __builtin_neon_vamin_f16((int8x8_t)__p0, 
(int8x8_t)__p1, 8); 43354 return __ret; 43355 } 43356 #else 43357 __ai __attribute__((target("neon,faminmax"))) float16x4_t vamin_f16(float16x4_t __p0, float16x4_t __p1) { 43358 float16x4_t __ret; 43359 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43360 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 43361 __ret = (float16x4_t) __builtin_neon_vamin_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 43362 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 43363 return __ret; 43364 } 43365 #endif 43366 43367 #endif 43368 #if defined(__aarch64__) || defined(__arm64ec__) 43369 __ai __attribute__((target("aes,neon"))) poly128_t vmull_p64(poly64_t __p0, poly64_t __p1) { 43370 poly128_t __ret; 43371 __ret = (poly128_t) __builtin_neon_vmull_p64(__p0, __p1); 43372 return __ret; 43373 } 43374 #ifdef __LITTLE_ENDIAN__ 43375 #define vcopyq_lane_bf16(__p0_230, __p1_230, __p2_230, __p3_230) __extension__ ({ \ 43376 bfloat16x8_t __ret_230; \ 43377 bfloat16x8_t __s0_230 = __p0_230; \ 43378 bfloat16x4_t __s2_230 = __p2_230; \ 43379 __ret_230 = vsetq_lane_bf16(vget_lane_bf16(__s2_230, __p3_230), __s0_230, __p1_230); \ 43380 __ret_230; \ 43381 }) 43382 #else 43383 #define vcopyq_lane_bf16(__p0_231, __p1_231, __p2_231, __p3_231) __extension__ ({ \ 43384 bfloat16x8_t __ret_231; \ 43385 bfloat16x8_t __s0_231 = __p0_231; \ 43386 bfloat16x4_t __s2_231 = __p2_231; \ 43387 bfloat16x8_t __rev0_231; __rev0_231 = __builtin_shufflevector(__s0_231, __s0_231, 7, 6, 5, 4, 3, 2, 1, 0); \ 43388 bfloat16x4_t __rev2_231; __rev2_231 = __builtin_shufflevector(__s2_231, __s2_231, 3, 2, 1, 0); \ 43389 __ret_231 = __noswap_vsetq_lane_bf16(__noswap_vget_lane_bf16(__rev2_231, __p3_231), __rev0_231, __p1_231); \ 43390 __ret_231 = __builtin_shufflevector(__ret_231, __ret_231, 7, 6, 5, 4, 3, 2, 1, 0); \ 43391 __ret_231; \ 43392 }) 43393 #endif 43394 43395 #ifdef __LITTLE_ENDIAN__ 43396 #define vcopy_lane_bf16(__p0_232, __p1_232, __p2_232, __p3_232) 
__extension__ ({ \ 43397 bfloat16x4_t __ret_232; \ 43398 bfloat16x4_t __s0_232 = __p0_232; \ 43399 bfloat16x4_t __s2_232 = __p2_232; \ 43400 __ret_232 = vset_lane_bf16(vget_lane_bf16(__s2_232, __p3_232), __s0_232, __p1_232); \ 43401 __ret_232; \ 43402 }) 43403 #else 43404 #define vcopy_lane_bf16(__p0_233, __p1_233, __p2_233, __p3_233) __extension__ ({ \ 43405 bfloat16x4_t __ret_233; \ 43406 bfloat16x4_t __s0_233 = __p0_233; \ 43407 bfloat16x4_t __s2_233 = __p2_233; \ 43408 bfloat16x4_t __rev0_233; __rev0_233 = __builtin_shufflevector(__s0_233, __s0_233, 3, 2, 1, 0); \ 43409 bfloat16x4_t __rev2_233; __rev2_233 = __builtin_shufflevector(__s2_233, __s2_233, 3, 2, 1, 0); \ 43410 __ret_233 = __noswap_vset_lane_bf16(__noswap_vget_lane_bf16(__rev2_233, __p3_233), __rev0_233, __p1_233); \ 43411 __ret_233 = __builtin_shufflevector(__ret_233, __ret_233, 3, 2, 1, 0); \ 43412 __ret_233; \ 43413 }) 43414 #endif 43415 43416 #ifdef __LITTLE_ENDIAN__ 43417 #define vcopyq_laneq_bf16(__p0_234, __p1_234, __p2_234, __p3_234) __extension__ ({ \ 43418 bfloat16x8_t __ret_234; \ 43419 bfloat16x8_t __s0_234 = __p0_234; \ 43420 bfloat16x8_t __s2_234 = __p2_234; \ 43421 __ret_234 = vsetq_lane_bf16(vgetq_lane_bf16(__s2_234, __p3_234), __s0_234, __p1_234); \ 43422 __ret_234; \ 43423 }) 43424 #else 43425 #define vcopyq_laneq_bf16(__p0_235, __p1_235, __p2_235, __p3_235) __extension__ ({ \ 43426 bfloat16x8_t __ret_235; \ 43427 bfloat16x8_t __s0_235 = __p0_235; \ 43428 bfloat16x8_t __s2_235 = __p2_235; \ 43429 bfloat16x8_t __rev0_235; __rev0_235 = __builtin_shufflevector(__s0_235, __s0_235, 7, 6, 5, 4, 3, 2, 1, 0); \ 43430 bfloat16x8_t __rev2_235; __rev2_235 = __builtin_shufflevector(__s2_235, __s2_235, 7, 6, 5, 4, 3, 2, 1, 0); \ 43431 __ret_235 = __noswap_vsetq_lane_bf16(__noswap_vgetq_lane_bf16(__rev2_235, __p3_235), __rev0_235, __p1_235); \ 43432 __ret_235 = __builtin_shufflevector(__ret_235, __ret_235, 7, 6, 5, 4, 3, 2, 1, 0); \ 43433 __ret_235; \ 43434 }) 43435 #endif 43436 43437 #ifdef 
__LITTLE_ENDIAN__ 43438 #define vcopy_laneq_bf16(__p0_236, __p1_236, __p2_236, __p3_236) __extension__ ({ \ 43439 bfloat16x4_t __ret_236; \ 43440 bfloat16x4_t __s0_236 = __p0_236; \ 43441 bfloat16x8_t __s2_236 = __p2_236; \ 43442 __ret_236 = vset_lane_bf16(vgetq_lane_bf16(__s2_236, __p3_236), __s0_236, __p1_236); \ 43443 __ret_236; \ 43444 }) 43445 #else 43446 #define vcopy_laneq_bf16(__p0_237, __p1_237, __p2_237, __p3_237) __extension__ ({ \ 43447 bfloat16x4_t __ret_237; \ 43448 bfloat16x4_t __s0_237 = __p0_237; \ 43449 bfloat16x8_t __s2_237 = __p2_237; \ 43450 bfloat16x4_t __rev0_237; __rev0_237 = __builtin_shufflevector(__s0_237, __s0_237, 3, 2, 1, 0); \ 43451 bfloat16x8_t __rev2_237; __rev2_237 = __builtin_shufflevector(__s2_237, __s2_237, 7, 6, 5, 4, 3, 2, 1, 0); \ 43452 __ret_237 = __noswap_vset_lane_bf16(__noswap_vgetq_lane_bf16(__rev2_237, __p3_237), __rev0_237, __p1_237); \ 43453 __ret_237 = __builtin_shufflevector(__ret_237, __ret_237, 3, 2, 1, 0); \ 43454 __ret_237; \ 43455 }) 43456 #endif 43457 43458 #ifdef __LITTLE_ENDIAN__ 43459 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vcvt_bf16_f32(float32x4_t __p0) { 43460 bfloat16x4_t __ret; 43461 __ret = (bfloat16x4_t) __builtin_neon_vcvt_bf16_f32((int8x16_t)__p0, 11); 43462 return __ret; 43463 } 43464 #else 43465 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vcvt_bf16_f32(float32x4_t __p0) { 43466 bfloat16x4_t __ret; 43467 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43468 __ret = (bfloat16x4_t) __builtin_neon_vcvt_bf16_f32((int8x16_t)__rev0, 11); 43469 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 43470 return __ret; 43471 } 43472 #endif 43473 43474 #ifdef __LITTLE_ENDIAN__ 43475 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_high_bf16_f32(bfloat16x8_t __p0, float32x4_t __p1) { 43476 bfloat16x8_t __ret; 43477 __ret = (bfloat16x8_t) __builtin_neon_vcvtq_high_bf16_f32((int8x16_t)__p0, (int8x16_t)__p1, 43); 43478 return __ret; 43479 
} 43480 #else 43481 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_high_bf16_f32(bfloat16x8_t __p0, float32x4_t __p1) { 43482 bfloat16x8_t __ret; 43483 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 43484 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 43485 __ret = (bfloat16x8_t) __builtin_neon_vcvtq_high_bf16_f32((int8x16_t)__rev0, (int8x16_t)__rev1, 43); 43486 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 43487 return __ret; 43488 } 43489 #endif 43490 43491 #ifdef __LITTLE_ENDIAN__ 43492 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_low_bf16_f32(float32x4_t __p0) { 43493 bfloat16x8_t __ret; 43494 __ret = (bfloat16x8_t) __builtin_neon_vcvtq_low_bf16_f32((int8x16_t)__p0, 43); 43495 return __ret; 43496 } 43497 #else 43498 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vcvtq_low_bf16_f32(float32x4_t __p0) { 43499 bfloat16x8_t __ret; 43500 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43501 __ret = (bfloat16x8_t) __builtin_neon_vcvtq_low_bf16_f32((int8x16_t)__rev0, 43); 43502 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 43503 return __ret; 43504 } 43505 #endif 43506 43507 __ai __attribute__((target("bf16,neon"))) poly8x8_t vreinterpret_p8_bf16(bfloat16x4_t __p0) { 43508 poly8x8_t __ret; 43509 __ret = (poly8x8_t)(__p0); 43510 return __ret; 43511 } 43512 __ai __attribute__((target("bf16,neon"))) poly64x1_t vreinterpret_p64_bf16(bfloat16x4_t __p0) { 43513 poly64x1_t __ret; 43514 __ret = (poly64x1_t)(__p0); 43515 return __ret; 43516 } 43517 __ai __attribute__((target("bf16,neon"))) poly16x4_t vreinterpret_p16_bf16(bfloat16x4_t __p0) { 43518 poly16x4_t __ret; 43519 __ret = (poly16x4_t)(__p0); 43520 return __ret; 43521 } 43522 __ai __attribute__((target("bf16,neon"))) poly8x16_t vreinterpretq_p8_bf16(bfloat16x8_t __p0) { 43523 poly8x16_t __ret; 43524 __ret = (poly8x16_t)(__p0); 
43525 return __ret; 43526 } 43527 __ai __attribute__((target("bf16,neon"))) poly128_t vreinterpretq_p128_bf16(bfloat16x8_t __p0) { 43528 poly128_t __ret; 43529 __ret = (poly128_t)(__p0); 43530 return __ret; 43531 } 43532 __ai __attribute__((target("bf16,neon"))) poly64x2_t vreinterpretq_p64_bf16(bfloat16x8_t __p0) { 43533 poly64x2_t __ret; 43534 __ret = (poly64x2_t)(__p0); 43535 return __ret; 43536 } 43537 __ai __attribute__((target("bf16,neon"))) poly16x8_t vreinterpretq_p16_bf16(bfloat16x8_t __p0) { 43538 poly16x8_t __ret; 43539 __ret = (poly16x8_t)(__p0); 43540 return __ret; 43541 } 43542 __ai __attribute__((target("bf16,neon"))) uint8x16_t vreinterpretq_u8_bf16(bfloat16x8_t __p0) { 43543 uint8x16_t __ret; 43544 __ret = (uint8x16_t)(__p0); 43545 return __ret; 43546 } 43547 __ai __attribute__((target("bf16,neon"))) uint32x4_t vreinterpretq_u32_bf16(bfloat16x8_t __p0) { 43548 uint32x4_t __ret; 43549 __ret = (uint32x4_t)(__p0); 43550 return __ret; 43551 } 43552 __ai __attribute__((target("bf16,neon"))) uint64x2_t vreinterpretq_u64_bf16(bfloat16x8_t __p0) { 43553 uint64x2_t __ret; 43554 __ret = (uint64x2_t)(__p0); 43555 return __ret; 43556 } 43557 __ai __attribute__((target("bf16,neon"))) uint16x8_t vreinterpretq_u16_bf16(bfloat16x8_t __p0) { 43558 uint16x8_t __ret; 43559 __ret = (uint16x8_t)(__p0); 43560 return __ret; 43561 } 43562 __ai __attribute__((target("bf16,neon"))) int8x16_t vreinterpretq_s8_bf16(bfloat16x8_t __p0) { 43563 int8x16_t __ret; 43564 __ret = (int8x16_t)(__p0); 43565 return __ret; 43566 } 43567 __ai __attribute__((target("bf16,neon"))) float64x2_t vreinterpretq_f64_bf16(bfloat16x8_t __p0) { 43568 float64x2_t __ret; 43569 __ret = (float64x2_t)(__p0); 43570 return __ret; 43571 } 43572 __ai __attribute__((target("bf16,neon"))) float32x4_t vreinterpretq_f32_bf16(bfloat16x8_t __p0) { 43573 float32x4_t __ret; 43574 __ret = (float32x4_t)(__p0); 43575 return __ret; 43576 } 43577 __ai __attribute__((target("bf16,neon"))) float16x8_t 
vreinterpretq_f16_bf16(bfloat16x8_t __p0) { 43578 float16x8_t __ret; 43579 __ret = (float16x8_t)(__p0); 43580 return __ret; 43581 } 43582 __ai __attribute__((target("bf16,neon"))) int32x4_t vreinterpretq_s32_bf16(bfloat16x8_t __p0) { 43583 int32x4_t __ret; 43584 __ret = (int32x4_t)(__p0); 43585 return __ret; 43586 } 43587 __ai __attribute__((target("bf16,neon"))) int64x2_t vreinterpretq_s64_bf16(bfloat16x8_t __p0) { 43588 int64x2_t __ret; 43589 __ret = (int64x2_t)(__p0); 43590 return __ret; 43591 } 43592 __ai __attribute__((target("bf16,neon"))) int16x8_t vreinterpretq_s16_bf16(bfloat16x8_t __p0) { 43593 int16x8_t __ret; 43594 __ret = (int16x8_t)(__p0); 43595 return __ret; 43596 } 43597 __ai __attribute__((target("bf16,neon"))) uint8x8_t vreinterpret_u8_bf16(bfloat16x4_t __p0) { 43598 uint8x8_t __ret; 43599 __ret = (uint8x8_t)(__p0); 43600 return __ret; 43601 } 43602 __ai __attribute__((target("bf16,neon"))) uint32x2_t vreinterpret_u32_bf16(bfloat16x4_t __p0) { 43603 uint32x2_t __ret; 43604 __ret = (uint32x2_t)(__p0); 43605 return __ret; 43606 } 43607 __ai __attribute__((target("bf16,neon"))) uint64x1_t vreinterpret_u64_bf16(bfloat16x4_t __p0) { 43608 uint64x1_t __ret; 43609 __ret = (uint64x1_t)(__p0); 43610 return __ret; 43611 } 43612 __ai __attribute__((target("bf16,neon"))) uint16x4_t vreinterpret_u16_bf16(bfloat16x4_t __p0) { 43613 uint16x4_t __ret; 43614 __ret = (uint16x4_t)(__p0); 43615 return __ret; 43616 } 43617 __ai __attribute__((target("bf16,neon"))) int8x8_t vreinterpret_s8_bf16(bfloat16x4_t __p0) { 43618 int8x8_t __ret; 43619 __ret = (int8x8_t)(__p0); 43620 return __ret; 43621 } 43622 __ai __attribute__((target("bf16,neon"))) float64x1_t vreinterpret_f64_bf16(bfloat16x4_t __p0) { 43623 float64x1_t __ret; 43624 __ret = (float64x1_t)(__p0); 43625 return __ret; 43626 } 43627 __ai __attribute__((target("bf16,neon"))) float32x2_t vreinterpret_f32_bf16(bfloat16x4_t __p0) { 43628 float32x2_t __ret; 43629 __ret = (float32x2_t)(__p0); 43630 return __ret; 43631 
} 43632 __ai __attribute__((target("bf16,neon"))) float16x4_t vreinterpret_f16_bf16(bfloat16x4_t __p0) { 43633 float16x4_t __ret; 43634 __ret = (float16x4_t)(__p0); 43635 return __ret; 43636 } 43637 __ai __attribute__((target("bf16,neon"))) int32x2_t vreinterpret_s32_bf16(bfloat16x4_t __p0) { 43638 int32x2_t __ret; 43639 __ret = (int32x2_t)(__p0); 43640 return __ret; 43641 } 43642 __ai __attribute__((target("bf16,neon"))) int64x1_t vreinterpret_s64_bf16(bfloat16x4_t __p0) { 43643 int64x1_t __ret; 43644 __ret = (int64x1_t)(__p0); 43645 return __ret; 43646 } 43647 __ai __attribute__((target("bf16,neon"))) int16x4_t vreinterpret_s16_bf16(bfloat16x4_t __p0) { 43648 int16x4_t __ret; 43649 __ret = (int16x4_t)(__p0); 43650 return __ret; 43651 } 43652 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p8(poly8x16_t __p0) { 43653 bfloat16x8_t __ret; 43654 __ret = (bfloat16x8_t)(__p0); 43655 return __ret; 43656 } 43657 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p128(poly128_t __p0) { 43658 bfloat16x8_t __ret; 43659 __ret = (bfloat16x8_t)(__p0); 43660 return __ret; 43661 } 43662 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p64(poly64x2_t __p0) { 43663 bfloat16x8_t __ret; 43664 __ret = (bfloat16x8_t)(__p0); 43665 return __ret; 43666 } 43667 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_p16(poly16x8_t __p0) { 43668 bfloat16x8_t __ret; 43669 __ret = (bfloat16x8_t)(__p0); 43670 return __ret; 43671 } 43672 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u8(uint8x16_t __p0) { 43673 bfloat16x8_t __ret; 43674 __ret = (bfloat16x8_t)(__p0); 43675 return __ret; 43676 } 43677 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u32(uint32x4_t __p0) { 43678 bfloat16x8_t __ret; 43679 __ret = (bfloat16x8_t)(__p0); 43680 return __ret; 43681 } 43682 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u64(uint64x2_t 
__p0) { 43683 bfloat16x8_t __ret; 43684 __ret = (bfloat16x8_t)(__p0); 43685 return __ret; 43686 } 43687 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_u16(uint16x8_t __p0) { 43688 bfloat16x8_t __ret; 43689 __ret = (bfloat16x8_t)(__p0); 43690 return __ret; 43691 } 43692 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s8(int8x16_t __p0) { 43693 bfloat16x8_t __ret; 43694 __ret = (bfloat16x8_t)(__p0); 43695 return __ret; 43696 } 43697 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f64(float64x2_t __p0) { 43698 bfloat16x8_t __ret; 43699 __ret = (bfloat16x8_t)(__p0); 43700 return __ret; 43701 } 43702 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f32(float32x4_t __p0) { 43703 bfloat16x8_t __ret; 43704 __ret = (bfloat16x8_t)(__p0); 43705 return __ret; 43706 } 43707 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_f16(float16x8_t __p0) { 43708 bfloat16x8_t __ret; 43709 __ret = (bfloat16x8_t)(__p0); 43710 return __ret; 43711 } 43712 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s32(int32x4_t __p0) { 43713 bfloat16x8_t __ret; 43714 __ret = (bfloat16x8_t)(__p0); 43715 return __ret; 43716 } 43717 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s64(int64x2_t __p0) { 43718 bfloat16x8_t __ret; 43719 __ret = (bfloat16x8_t)(__p0); 43720 return __ret; 43721 } 43722 __ai __attribute__((target("bf16,neon"))) bfloat16x8_t vreinterpretq_bf16_s16(int16x8_t __p0) { 43723 bfloat16x8_t __ret; 43724 __ret = (bfloat16x8_t)(__p0); 43725 return __ret; 43726 } 43727 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p8(poly8x8_t __p0) { 43728 bfloat16x4_t __ret; 43729 __ret = (bfloat16x4_t)(__p0); 43730 return __ret; 43731 } 43732 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p64(poly64x1_t __p0) { 43733 bfloat16x4_t __ret; 43734 __ret = (bfloat16x4_t)(__p0); 43735 
return __ret; 43736 } 43737 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_p16(poly16x4_t __p0) { 43738 bfloat16x4_t __ret; 43739 __ret = (bfloat16x4_t)(__p0); 43740 return __ret; 43741 } 43742 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u8(uint8x8_t __p0) { 43743 bfloat16x4_t __ret; 43744 __ret = (bfloat16x4_t)(__p0); 43745 return __ret; 43746 } 43747 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u32(uint32x2_t __p0) { 43748 bfloat16x4_t __ret; 43749 __ret = (bfloat16x4_t)(__p0); 43750 return __ret; 43751 } 43752 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u64(uint64x1_t __p0) { 43753 bfloat16x4_t __ret; 43754 __ret = (bfloat16x4_t)(__p0); 43755 return __ret; 43756 } 43757 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_u16(uint16x4_t __p0) { 43758 bfloat16x4_t __ret; 43759 __ret = (bfloat16x4_t)(__p0); 43760 return __ret; 43761 } 43762 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s8(int8x8_t __p0) { 43763 bfloat16x4_t __ret; 43764 __ret = (bfloat16x4_t)(__p0); 43765 return __ret; 43766 } 43767 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f64(float64x1_t __p0) { 43768 bfloat16x4_t __ret; 43769 __ret = (bfloat16x4_t)(__p0); 43770 return __ret; 43771 } 43772 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f32(float32x2_t __p0) { 43773 bfloat16x4_t __ret; 43774 __ret = (bfloat16x4_t)(__p0); 43775 return __ret; 43776 } 43777 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_f16(float16x4_t __p0) { 43778 bfloat16x4_t __ret; 43779 __ret = (bfloat16x4_t)(__p0); 43780 return __ret; 43781 } 43782 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s32(int32x2_t __p0) { 43783 bfloat16x4_t __ret; 43784 __ret = (bfloat16x4_t)(__p0); 43785 return __ret; 43786 } 43787 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t 
vreinterpret_bf16_s64(int64x1_t __p0) { 43788 bfloat16x4_t __ret; 43789 __ret = (bfloat16x4_t)(__p0); 43790 return __ret; 43791 } 43792 __ai __attribute__((target("bf16,neon"))) bfloat16x4_t vreinterpret_bf16_s16(int16x4_t __p0) { 43793 bfloat16x4_t __ret; 43794 __ret = (bfloat16x4_t)(__p0); 43795 return __ret; 43796 } 43797 #ifdef __LITTLE_ENDIAN__ 43798 #define vdotq_laneq_u32(__p0_238, __p1_238, __p2_238, __p3_238) __extension__ ({ \ 43799 uint32x4_t __ret_238; \ 43800 uint32x4_t __s0_238 = __p0_238; \ 43801 uint8x16_t __s1_238 = __p1_238; \ 43802 uint8x16_t __s2_238 = __p2_238; \ 43803 __ret_238 = vdotq_u32(__s0_238, __s1_238, __builtin_bit_cast(uint8x16_t, splatq_laneq_u32(__builtin_bit_cast(uint32x4_t, __s2_238), __p3_238))); \ 43804 __ret_238; \ 43805 }) 43806 #else 43807 #define vdotq_laneq_u32(__p0_239, __p1_239, __p2_239, __p3_239) __extension__ ({ \ 43808 uint32x4_t __ret_239; \ 43809 uint32x4_t __s0_239 = __p0_239; \ 43810 uint8x16_t __s1_239 = __p1_239; \ 43811 uint8x16_t __s2_239 = __p2_239; \ 43812 uint32x4_t __rev0_239; __rev0_239 = __builtin_shufflevector(__s0_239, __s0_239, 3, 2, 1, 0); \ 43813 uint8x16_t __rev1_239; __rev1_239 = __builtin_shufflevector(__s1_239, __s1_239, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43814 uint8x16_t __rev2_239; __rev2_239 = __builtin_shufflevector(__s2_239, __s2_239, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43815 __ret_239 = __noswap_vdotq_u32(__rev0_239, __rev1_239, __builtin_bit_cast(uint8x16_t, __noswap_splatq_laneq_u32(__builtin_bit_cast(uint32x4_t, __rev2_239), __p3_239))); \ 43816 __ret_239 = __builtin_shufflevector(__ret_239, __ret_239, 3, 2, 1, 0); \ 43817 __ret_239; \ 43818 }) 43819 #endif 43820 43821 #ifdef __LITTLE_ENDIAN__ 43822 #define vdotq_laneq_s32(__p0_240, __p1_240, __p2_240, __p3_240) __extension__ ({ \ 43823 int32x4_t __ret_240; \ 43824 int32x4_t __s0_240 = __p0_240; \ 43825 int8x16_t __s1_240 = __p1_240; \ 43826 int8x16_t __s2_240 = __p2_240; \ 43827 __ret_240 = 
vdotq_s32(__s0_240, __s1_240, __builtin_bit_cast(int8x16_t, splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_240), __p3_240))); \ 43828 __ret_240; \ 43829 }) 43830 #else 43831 #define vdotq_laneq_s32(__p0_241, __p1_241, __p2_241, __p3_241) __extension__ ({ \ 43832 int32x4_t __ret_241; \ 43833 int32x4_t __s0_241 = __p0_241; \ 43834 int8x16_t __s1_241 = __p1_241; \ 43835 int8x16_t __s2_241 = __p2_241; \ 43836 int32x4_t __rev0_241; __rev0_241 = __builtin_shufflevector(__s0_241, __s0_241, 3, 2, 1, 0); \ 43837 int8x16_t __rev1_241; __rev1_241 = __builtin_shufflevector(__s1_241, __s1_241, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43838 int8x16_t __rev2_241; __rev2_241 = __builtin_shufflevector(__s2_241, __s2_241, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43839 __ret_241 = __noswap_vdotq_s32(__rev0_241, __rev1_241, __builtin_bit_cast(int8x16_t, __noswap_splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_241), __p3_241))); \ 43840 __ret_241 = __builtin_shufflevector(__ret_241, __ret_241, 3, 2, 1, 0); \ 43841 __ret_241; \ 43842 }) 43843 #endif 43844 43845 #ifdef __LITTLE_ENDIAN__ 43846 #define vdot_laneq_u32(__p0_242, __p1_242, __p2_242, __p3_242) __extension__ ({ \ 43847 uint32x2_t __ret_242; \ 43848 uint32x2_t __s0_242 = __p0_242; \ 43849 uint8x8_t __s1_242 = __p1_242; \ 43850 uint8x16_t __s2_242 = __p2_242; \ 43851 __ret_242 = vdot_u32(__s0_242, __s1_242, __builtin_bit_cast(uint8x8_t, splat_laneq_u32(__builtin_bit_cast(uint32x4_t, __s2_242), __p3_242))); \ 43852 __ret_242; \ 43853 }) 43854 #else 43855 #define vdot_laneq_u32(__p0_243, __p1_243, __p2_243, __p3_243) __extension__ ({ \ 43856 uint32x2_t __ret_243; \ 43857 uint32x2_t __s0_243 = __p0_243; \ 43858 uint8x8_t __s1_243 = __p1_243; \ 43859 uint8x16_t __s2_243 = __p2_243; \ 43860 uint32x2_t __rev0_243; __rev0_243 = __builtin_shufflevector(__s0_243, __s0_243, 1, 0); \ 43861 uint8x8_t __rev1_243; __rev1_243 = __builtin_shufflevector(__s1_243, __s1_243, 7, 6, 5, 4, 3, 2, 1, 0); \ 
43862 uint8x16_t __rev2_243; __rev2_243 = __builtin_shufflevector(__s2_243, __s2_243, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43863 __ret_243 = __noswap_vdot_u32(__rev0_243, __rev1_243, __builtin_bit_cast(uint8x8_t, __noswap_splat_laneq_u32(__builtin_bit_cast(uint32x4_t, __rev2_243), __p3_243))); \ 43864 __ret_243 = __builtin_shufflevector(__ret_243, __ret_243, 1, 0); \ 43865 __ret_243; \ 43866 }) 43867 #endif 43868 43869 #ifdef __LITTLE_ENDIAN__ 43870 #define vdot_laneq_s32(__p0_244, __p1_244, __p2_244, __p3_244) __extension__ ({ \ 43871 int32x2_t __ret_244; \ 43872 int32x2_t __s0_244 = __p0_244; \ 43873 int8x8_t __s1_244 = __p1_244; \ 43874 int8x16_t __s2_244 = __p2_244; \ 43875 __ret_244 = vdot_s32(__s0_244, __s1_244, __builtin_bit_cast(int8x8_t, splat_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_244), __p3_244))); \ 43876 __ret_244; \ 43877 }) 43878 #else 43879 #define vdot_laneq_s32(__p0_245, __p1_245, __p2_245, __p3_245) __extension__ ({ \ 43880 int32x2_t __ret_245; \ 43881 int32x2_t __s0_245 = __p0_245; \ 43882 int8x8_t __s1_245 = __p1_245; \ 43883 int8x16_t __s2_245 = __p2_245; \ 43884 int32x2_t __rev0_245; __rev0_245 = __builtin_shufflevector(__s0_245, __s0_245, 1, 0); \ 43885 int8x8_t __rev1_245; __rev1_245 = __builtin_shufflevector(__s1_245, __s1_245, 7, 6, 5, 4, 3, 2, 1, 0); \ 43886 int8x16_t __rev2_245; __rev2_245 = __builtin_shufflevector(__s2_245, __s2_245, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 43887 __ret_245 = __noswap_vdot_s32(__rev0_245, __rev1_245, __builtin_bit_cast(int8x8_t, __noswap_splat_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_245), __p3_245))); \ 43888 __ret_245 = __builtin_shufflevector(__ret_245, __ret_245, 1, 0); \ 43889 __ret_245; \ 43890 }) 43891 #endif 43892 43893 #ifdef __LITTLE_ENDIAN__ 43894 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlalq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 43895 float32x4_t __ret; 43896 __ret = (float32x4_t) 
__builtin_neon_vfmlalq_high_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 43897 return __ret; 43898 } 43899 #else 43900 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlalq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 43901 float32x4_t __ret; 43902 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43903 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 43904 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 43905 __ret = (float32x4_t) __builtin_neon_vfmlalq_high_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 43906 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 43907 return __ret; 43908 } 43909 __ai __attribute__((target("fp16fml,neon"))) float32x4_t __noswap_vfmlalq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 43910 float32x4_t __ret; 43911 __ret = (float32x4_t) __builtin_neon_vfmlalq_high_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 43912 return __ret; 43913 } 43914 #endif 43915 43916 #ifdef __LITTLE_ENDIAN__ 43917 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlal_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 43918 float32x2_t __ret; 43919 __ret = (float32x2_t) __builtin_neon_vfmlal_high_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 43920 return __ret; 43921 } 43922 #else 43923 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlal_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 43924 float32x2_t __ret; 43925 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 43926 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 43927 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 43928 __ret = (float32x2_t) __builtin_neon_vfmlal_high_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 43929 __ret = 
__builtin_shufflevector(__ret, __ret, 1, 0); 43930 return __ret; 43931 } 43932 __ai __attribute__((target("fp16fml,neon"))) float32x2_t __noswap_vfmlal_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 43933 float32x2_t __ret; 43934 __ret = (float32x2_t) __builtin_neon_vfmlal_high_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 43935 return __ret; 43936 } 43937 #endif 43938 43939 #ifdef __LITTLE_ENDIAN__ 43940 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlalq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 43941 float32x4_t __ret; 43942 __ret = (float32x4_t) __builtin_neon_vfmlalq_low_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 43943 return __ret; 43944 } 43945 #else 43946 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlalq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 43947 float32x4_t __ret; 43948 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43949 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 43950 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 43951 __ret = (float32x4_t) __builtin_neon_vfmlalq_low_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 43952 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 43953 return __ret; 43954 } 43955 __ai __attribute__((target("fp16fml,neon"))) float32x4_t __noswap_vfmlalq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 43956 float32x4_t __ret; 43957 __ret = (float32x4_t) __builtin_neon_vfmlalq_low_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 43958 return __ret; 43959 } 43960 #endif 43961 43962 #ifdef __LITTLE_ENDIAN__ 43963 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlal_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 43964 float32x2_t __ret; 43965 __ret = (float32x2_t) __builtin_neon_vfmlal_low_f16((int8x8_t)__p0, 
(int8x8_t)__p1, (int8x8_t)__p2, 9); 43966 return __ret; 43967 } 43968 #else 43969 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlal_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 43970 float32x2_t __ret; 43971 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 43972 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 43973 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 43974 __ret = (float32x2_t) __builtin_neon_vfmlal_low_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 43975 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 43976 return __ret; 43977 } 43978 __ai __attribute__((target("fp16fml,neon"))) float32x2_t __noswap_vfmlal_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 43979 float32x2_t __ret; 43980 __ret = (float32x2_t) __builtin_neon_vfmlal_low_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 43981 return __ret; 43982 } 43983 #endif 43984 43985 #ifdef __LITTLE_ENDIAN__ 43986 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlslq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 43987 float32x4_t __ret; 43988 __ret = (float32x4_t) __builtin_neon_vfmlslq_high_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 43989 return __ret; 43990 } 43991 #else 43992 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlslq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 43993 float32x4_t __ret; 43994 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 43995 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 43996 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 43997 __ret = (float32x4_t) __builtin_neon_vfmlslq_high_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 43998 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 43999 return 
__ret; 44000 } 44001 __ai __attribute__((target("fp16fml,neon"))) float32x4_t __noswap_vfmlslq_high_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 44002 float32x4_t __ret; 44003 __ret = (float32x4_t) __builtin_neon_vfmlslq_high_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 44004 return __ret; 44005 } 44006 #endif 44007 44008 #ifdef __LITTLE_ENDIAN__ 44009 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlsl_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 44010 float32x2_t __ret; 44011 __ret = (float32x2_t) __builtin_neon_vfmlsl_high_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 44012 return __ret; 44013 } 44014 #else 44015 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlsl_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 44016 float32x2_t __ret; 44017 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 44018 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 44019 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 44020 __ret = (float32x2_t) __builtin_neon_vfmlsl_high_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 44021 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 44022 return __ret; 44023 } 44024 __ai __attribute__((target("fp16fml,neon"))) float32x2_t __noswap_vfmlsl_high_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 44025 float32x2_t __ret; 44026 __ret = (float32x2_t) __builtin_neon_vfmlsl_high_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 44027 return __ret; 44028 } 44029 #endif 44030 44031 #ifdef __LITTLE_ENDIAN__ 44032 __ai __attribute__((target("fp16fml,neon"))) float32x4_t vfmlslq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 44033 float32x4_t __ret; 44034 __ret = (float32x4_t) __builtin_neon_vfmlslq_low_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 44035 return __ret; 44036 } 44037 #else 44038 __ai 
__attribute__((target("fp16fml,neon"))) float32x4_t vfmlslq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 44039 float32x4_t __ret; 44040 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 44041 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 44042 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 44043 __ret = (float32x4_t) __builtin_neon_vfmlslq_low_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 41); 44044 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 44045 return __ret; 44046 } 44047 __ai __attribute__((target("fp16fml,neon"))) float32x4_t __noswap_vfmlslq_low_f16(float32x4_t __p0, float16x8_t __p1, float16x8_t __p2) { 44048 float32x4_t __ret; 44049 __ret = (float32x4_t) __builtin_neon_vfmlslq_low_f16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 41); 44050 return __ret; 44051 } 44052 #endif 44053 44054 #ifdef __LITTLE_ENDIAN__ 44055 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlsl_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 44056 float32x2_t __ret; 44057 __ret = (float32x2_t) __builtin_neon_vfmlsl_low_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 44058 return __ret; 44059 } 44060 #else 44061 __ai __attribute__((target("fp16fml,neon"))) float32x2_t vfmlsl_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 44062 float32x2_t __ret; 44063 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 44064 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 44065 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 44066 __ret = (float32x2_t) __builtin_neon_vfmlsl_low_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, 9); 44067 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 44068 return __ret; 44069 } 44070 __ai __attribute__((target("fp16fml,neon"))) float32x2_t 
__noswap_vfmlsl_low_f16(float32x2_t __p0, float16x4_t __p1, float16x4_t __p2) { 44071 float32x2_t __ret; 44072 __ret = (float32x2_t) __builtin_neon_vfmlsl_low_f16((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 9); 44073 return __ret; 44074 } 44075 #endif 44076 44077 #ifdef __LITTLE_ENDIAN__ 44078 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vdivq_f16(float16x8_t __p0, float16x8_t __p1) { 44079 float16x8_t __ret; 44080 __ret = __p0 / __p1; 44081 return __ret; 44082 } 44083 #else 44084 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vdivq_f16(float16x8_t __p0, float16x8_t __p1) { 44085 float16x8_t __ret; 44086 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 44087 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 44088 __ret = __rev0 / __rev1; 44089 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 44090 return __ret; 44091 } 44092 #endif 44093 44094 #ifdef __LITTLE_ENDIAN__ 44095 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vdiv_f16(float16x4_t __p0, float16x4_t __p1) { 44096 float16x4_t __ret; 44097 __ret = __p0 / __p1; 44098 return __ret; 44099 } 44100 #else 44101 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vdiv_f16(float16x4_t __p0, float16x4_t __p1) { 44102 float16x4_t __ret; 44103 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 44104 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 44105 __ret = __rev0 / __rev1; 44106 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 44107 return __ret; 44108 } 44109 #endif 44110 44111 #ifdef __LITTLE_ENDIAN__ 44112 #define vfmah_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44113 float16_t __ret; \ 44114 float16_t __s0 = __p0; \ 44115 float16_t __s1 = __p1; \ 44116 float16x4_t __s2 = __p2; \ 44117 __ret = (float16_t) __builtin_neon_vfmah_lane_f16(__s0, __s1, (float16x4_t)__s2, __p3); \ 44118 __ret; \ 
44119 }) 44120 #else 44121 #define vfmah_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44122 float16_t __ret; \ 44123 float16_t __s0 = __p0; \ 44124 float16_t __s1 = __p1; \ 44125 float16x4_t __s2 = __p2; \ 44126 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 44127 __ret = (float16_t) __builtin_neon_vfmah_lane_f16(__s0, __s1, (float16x4_t)__rev2, __p3); \ 44128 __ret; \ 44129 }) 44130 #define __noswap_vfmah_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44131 float16_t __ret; \ 44132 float16_t __s0 = __p0; \ 44133 float16_t __s1 = __p1; \ 44134 float16x4_t __s2 = __p2; \ 44135 __ret = (float16_t) __builtin_neon_vfmah_lane_f16(__s0, __s1, (float16x4_t)__s2, __p3); \ 44136 __ret; \ 44137 }) 44138 #endif 44139 44140 #ifdef __LITTLE_ENDIAN__ 44141 #define vfmaq_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44142 float16x8_t __ret; \ 44143 float16x8_t __s0 = __p0; \ 44144 float16x8_t __s1 = __p1; \ 44145 float16x4_t __s2 = __p2; \ 44146 __ret = (float16x8_t) __builtin_neon_vfmaq_lane_f16((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 40); \ 44147 __ret; \ 44148 }) 44149 #else 44150 #define vfmaq_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44151 float16x8_t __ret; \ 44152 float16x8_t __s0 = __p0; \ 44153 float16x8_t __s1 = __p1; \ 44154 float16x4_t __s2 = __p2; \ 44155 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44156 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 44157 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 44158 __ret = (float16x8_t) __builtin_neon_vfmaq_lane_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, __p3, 40); \ 44159 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 44160 __ret; \ 44161 }) 44162 #define __noswap_vfmaq_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44163 float16x8_t __ret; \ 44164 float16x8_t __s0 = __p0; \ 
44165 float16x8_t __s1 = __p1; \ 44166 float16x4_t __s2 = __p2; \ 44167 __ret = (float16x8_t) __builtin_neon_vfmaq_lane_f16((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 40); \ 44168 __ret; \ 44169 }) 44170 #endif 44171 44172 #ifdef __LITTLE_ENDIAN__ 44173 #define vfma_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44174 float16x4_t __ret; \ 44175 float16x4_t __s0 = __p0; \ 44176 float16x4_t __s1 = __p1; \ 44177 float16x4_t __s2 = __p2; \ 44178 __ret = (float16x4_t) __builtin_neon_vfma_lane_f16((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 8); \ 44179 __ret; \ 44180 }) 44181 #else 44182 #define vfma_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44183 float16x4_t __ret; \ 44184 float16x4_t __s0 = __p0; \ 44185 float16x4_t __s1 = __p1; \ 44186 float16x4_t __s2 = __p2; \ 44187 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44188 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 44189 float16x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 44190 __ret = (float16x4_t) __builtin_neon_vfma_lane_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, __p3, 8); \ 44191 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 44192 __ret; \ 44193 }) 44194 #define __noswap_vfma_lane_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44195 float16x4_t __ret; \ 44196 float16x4_t __s0 = __p0; \ 44197 float16x4_t __s1 = __p1; \ 44198 float16x4_t __s2 = __p2; \ 44199 __ret = (float16x4_t) __builtin_neon_vfma_lane_f16((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 8); \ 44200 __ret; \ 44201 }) 44202 #endif 44203 44204 #ifdef __LITTLE_ENDIAN__ 44205 #define vfmah_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44206 float16_t __ret; \ 44207 float16_t __s0 = __p0; \ 44208 float16_t __s1 = __p1; \ 44209 float16x8_t __s2 = __p2; \ 44210 __ret = (float16_t) __builtin_neon_vfmah_laneq_f16(__s0, __s1, (float16x8_t)__s2, __p3); \ 44211 __ret; \ 44212 }) 44213 
#else 44214 #define vfmah_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44215 float16_t __ret; \ 44216 float16_t __s0 = __p0; \ 44217 float16_t __s1 = __p1; \ 44218 float16x8_t __s2 = __p2; \ 44219 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 44220 __ret = (float16_t) __builtin_neon_vfmah_laneq_f16(__s0, __s1, (float16x8_t)__rev2, __p3); \ 44221 __ret; \ 44222 }) 44223 #define __noswap_vfmah_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44224 float16_t __ret; \ 44225 float16_t __s0 = __p0; \ 44226 float16_t __s1 = __p1; \ 44227 float16x8_t __s2 = __p2; \ 44228 __ret = (float16_t) __builtin_neon_vfmah_laneq_f16(__s0, __s1, (float16x8_t)__s2, __p3); \ 44229 __ret; \ 44230 }) 44231 #endif 44232 44233 #ifdef __LITTLE_ENDIAN__ 44234 #define vfmaq_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44235 float16x8_t __ret; \ 44236 float16x8_t __s0 = __p0; \ 44237 float16x8_t __s1 = __p1; \ 44238 float16x8_t __s2 = __p2; \ 44239 __ret = (float16x8_t) __builtin_neon_vfmaq_laneq_f16((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 40); \ 44240 __ret; \ 44241 }) 44242 #else 44243 #define vfmaq_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44244 float16x8_t __ret; \ 44245 float16x8_t __s0 = __p0; \ 44246 float16x8_t __s1 = __p1; \ 44247 float16x8_t __s2 = __p2; \ 44248 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44249 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 44250 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 44251 __ret = (float16x8_t) __builtin_neon_vfmaq_laneq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 40); \ 44252 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 44253 __ret; \ 44254 }) 44255 #define __noswap_vfmaq_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44256 float16x8_t __ret; \ 44257 
float16x8_t __s0 = __p0; \ 44258 float16x8_t __s1 = __p1; \ 44259 float16x8_t __s2 = __p2; \ 44260 __ret = (float16x8_t) __builtin_neon_vfmaq_laneq_f16((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 40); \ 44261 __ret; \ 44262 }) 44263 #endif 44264 44265 #ifdef __LITTLE_ENDIAN__ 44266 #define vfma_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44267 float16x4_t __ret; \ 44268 float16x4_t __s0 = __p0; \ 44269 float16x4_t __s1 = __p1; \ 44270 float16x8_t __s2 = __p2; \ 44271 __ret = (float16x4_t) __builtin_neon_vfma_laneq_f16((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 8); \ 44272 __ret; \ 44273 }) 44274 #else 44275 #define vfma_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44276 float16x4_t __ret; \ 44277 float16x4_t __s0 = __p0; \ 44278 float16x4_t __s1 = __p1; \ 44279 float16x8_t __s2 = __p2; \ 44280 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44281 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 44282 float16x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 44283 __ret = (float16x4_t) __builtin_neon_vfma_laneq_f16((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x16_t)__rev2, __p3, 8); \ 44284 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 44285 __ret; \ 44286 }) 44287 #define __noswap_vfma_laneq_f16(__p0, __p1, __p2, __p3) __extension__ ({ \ 44288 float16x4_t __ret; \ 44289 float16x4_t __s0 = __p0; \ 44290 float16x4_t __s1 = __p1; \ 44291 float16x8_t __s2 = __p2; \ 44292 __ret = (float16x4_t) __builtin_neon_vfma_laneq_f16((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 8); \ 44293 __ret; \ 44294 }) 44295 #endif 44296 44297 #ifdef __LITTLE_ENDIAN__ 44298 #define vfmaq_n_f16(__p0, __p1, __p2) __extension__ ({ \ 44299 float16x8_t __ret; \ 44300 float16x8_t __s0 = __p0; \ 44301 float16x8_t __s1 = __p1; \ 44302 float16_t __s2 = __p2; \ 44303 __ret = vfmaq_f16(__s0, __s1, (float16x8_t) {__s2, __s2, __s2, __s2, __s2, 
__s2, __s2, __s2}); \ 44304 __ret; \ 44305 }) 44306 #else 44307 #define vfmaq_n_f16(__p0, __p1, __p2) __extension__ ({ \ 44308 float16x8_t __ret; \ 44309 float16x8_t __s0 = __p0; \ 44310 float16x8_t __s1 = __p1; \ 44311 float16_t __s2 = __p2; \ 44312 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44313 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 44314 __ret = __noswap_vfmaq_f16(__rev0, __rev1, (float16x8_t) {__s2, __s2, __s2, __s2, __s2, __s2, __s2, __s2}); \ 44315 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 44316 __ret; \ 44317 }) 44318 #endif 44319 44320 #ifdef __LITTLE_ENDIAN__ 44321 #define vfma_n_f16(__p0, __p1, __p2) __extension__ ({ \ 44322 float16x4_t __ret; \ 44323 float16x4_t __s0 = __p0; \ 44324 float16x4_t __s1 = __p1; \ 44325 float16_t __s2 = __p2; \ 44326 __ret = vfma_f16(__s0, __s1, (float16x4_t) {__s2, __s2, __s2, __s2}); \ 44327 __ret; \ 44328 }) 44329 #else 44330 #define vfma_n_f16(__p0, __p1, __p2) __extension__ ({ \ 44331 float16x4_t __ret; \ 44332 float16x4_t __s0 = __p0; \ 44333 float16x4_t __s1 = __p1; \ 44334 float16_t __s2 = __p2; \ 44335 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44336 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 44337 __ret = __noswap_vfma_f16(__rev0, __rev1, (float16x4_t) {__s2, __s2, __s2, __s2}); \ 44338 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 44339 __ret; \ 44340 }) 44341 #endif 44342 44343 #ifdef __LITTLE_ENDIAN__ 44344 #define vfmsh_lane_f16(__p0_246, __p1_246, __p2_246, __p3_246) __extension__ ({ \ 44345 float16_t __ret_246; \ 44346 float16_t __s0_246 = __p0_246; \ 44347 float16_t __s1_246 = __p1_246; \ 44348 float16x4_t __s2_246 = __p2_246; \ 44349 __ret_246 = vfmah_lane_f16(__s0_246, -__s1_246, __s2_246, __p3_246); \ 44350 __ret_246; \ 44351 }) 44352 #else 44353 #define vfmsh_lane_f16(__p0_247, 
__p1_247, __p2_247, __p3_247) __extension__ ({ \ 44354 float16_t __ret_247; \ 44355 float16_t __s0_247 = __p0_247; \ 44356 float16_t __s1_247 = __p1_247; \ 44357 float16x4_t __s2_247 = __p2_247; \ 44358 float16x4_t __rev2_247; __rev2_247 = __builtin_shufflevector(__s2_247, __s2_247, 3, 2, 1, 0); \ 44359 __ret_247 = __noswap_vfmah_lane_f16(__s0_247, -__s1_247, __rev2_247, __p3_247); \ 44360 __ret_247; \ 44361 }) 44362 #endif 44363 44364 #ifdef __LITTLE_ENDIAN__ 44365 #define vfmsq_lane_f16(__p0_248, __p1_248, __p2_248, __p3_248) __extension__ ({ \ 44366 float16x8_t __ret_248; \ 44367 float16x8_t __s0_248 = __p0_248; \ 44368 float16x8_t __s1_248 = __p1_248; \ 44369 float16x4_t __s2_248 = __p2_248; \ 44370 __ret_248 = vfmaq_lane_f16(__s0_248, -__s1_248, __s2_248, __p3_248); \ 44371 __ret_248; \ 44372 }) 44373 #else 44374 #define vfmsq_lane_f16(__p0_249, __p1_249, __p2_249, __p3_249) __extension__ ({ \ 44375 float16x8_t __ret_249; \ 44376 float16x8_t __s0_249 = __p0_249; \ 44377 float16x8_t __s1_249 = __p1_249; \ 44378 float16x4_t __s2_249 = __p2_249; \ 44379 float16x8_t __rev0_249; __rev0_249 = __builtin_shufflevector(__s0_249, __s0_249, 7, 6, 5, 4, 3, 2, 1, 0); \ 44380 float16x8_t __rev1_249; __rev1_249 = __builtin_shufflevector(__s1_249, __s1_249, 7, 6, 5, 4, 3, 2, 1, 0); \ 44381 float16x4_t __rev2_249; __rev2_249 = __builtin_shufflevector(__s2_249, __s2_249, 3, 2, 1, 0); \ 44382 __ret_249 = __noswap_vfmaq_lane_f16(__rev0_249, -__rev1_249, __rev2_249, __p3_249); \ 44383 __ret_249 = __builtin_shufflevector(__ret_249, __ret_249, 7, 6, 5, 4, 3, 2, 1, 0); \ 44384 __ret_249; \ 44385 }) 44386 #endif 44387 44388 #ifdef __LITTLE_ENDIAN__ 44389 #define vfms_lane_f16(__p0_250, __p1_250, __p2_250, __p3_250) __extension__ ({ \ 44390 float16x4_t __ret_250; \ 44391 float16x4_t __s0_250 = __p0_250; \ 44392 float16x4_t __s1_250 = __p1_250; \ 44393 float16x4_t __s2_250 = __p2_250; \ 44394 __ret_250 = vfma_lane_f16(__s0_250, -__s1_250, __s2_250, __p3_250); \ 44395 __ret_250; \ 44396 
}) 44397 #else 44398 #define vfms_lane_f16(__p0_251, __p1_251, __p2_251, __p3_251) __extension__ ({ \ 44399 float16x4_t __ret_251; \ 44400 float16x4_t __s0_251 = __p0_251; \ 44401 float16x4_t __s1_251 = __p1_251; \ 44402 float16x4_t __s2_251 = __p2_251; \ 44403 float16x4_t __rev0_251; __rev0_251 = __builtin_shufflevector(__s0_251, __s0_251, 3, 2, 1, 0); \ 44404 float16x4_t __rev1_251; __rev1_251 = __builtin_shufflevector(__s1_251, __s1_251, 3, 2, 1, 0); \ 44405 float16x4_t __rev2_251; __rev2_251 = __builtin_shufflevector(__s2_251, __s2_251, 3, 2, 1, 0); \ 44406 __ret_251 = __noswap_vfma_lane_f16(__rev0_251, -__rev1_251, __rev2_251, __p3_251); \ 44407 __ret_251 = __builtin_shufflevector(__ret_251, __ret_251, 3, 2, 1, 0); \ 44408 __ret_251; \ 44409 }) 44410 #endif 44411 44412 #ifdef __LITTLE_ENDIAN__ 44413 #define vfmsh_laneq_f16(__p0_252, __p1_252, __p2_252, __p3_252) __extension__ ({ \ 44414 float16_t __ret_252; \ 44415 float16_t __s0_252 = __p0_252; \ 44416 float16_t __s1_252 = __p1_252; \ 44417 float16x8_t __s2_252 = __p2_252; \ 44418 __ret_252 = vfmah_laneq_f16(__s0_252, -__s1_252, __s2_252, __p3_252); \ 44419 __ret_252; \ 44420 }) 44421 #else 44422 #define vfmsh_laneq_f16(__p0_253, __p1_253, __p2_253, __p3_253) __extension__ ({ \ 44423 float16_t __ret_253; \ 44424 float16_t __s0_253 = __p0_253; \ 44425 float16_t __s1_253 = __p1_253; \ 44426 float16x8_t __s2_253 = __p2_253; \ 44427 float16x8_t __rev2_253; __rev2_253 = __builtin_shufflevector(__s2_253, __s2_253, 7, 6, 5, 4, 3, 2, 1, 0); \ 44428 __ret_253 = __noswap_vfmah_laneq_f16(__s0_253, -__s1_253, __rev2_253, __p3_253); \ 44429 __ret_253; \ 44430 }) 44431 #endif 44432 44433 #ifdef __LITTLE_ENDIAN__ 44434 #define vfmsq_laneq_f16(__p0_254, __p1_254, __p2_254, __p3_254) __extension__ ({ \ 44435 float16x8_t __ret_254; \ 44436 float16x8_t __s0_254 = __p0_254; \ 44437 float16x8_t __s1_254 = __p1_254; \ 44438 float16x8_t __s2_254 = __p2_254; \ 44439 __ret_254 = vfmaq_laneq_f16(__s0_254, -__s1_254, __s2_254, 
__p3_254); \ 44440 __ret_254; \ 44441 }) 44442 #else 44443 #define vfmsq_laneq_f16(__p0_255, __p1_255, __p2_255, __p3_255) __extension__ ({ \ 44444 float16x8_t __ret_255; \ 44445 float16x8_t __s0_255 = __p0_255; \ 44446 float16x8_t __s1_255 = __p1_255; \ 44447 float16x8_t __s2_255 = __p2_255; \ 44448 float16x8_t __rev0_255; __rev0_255 = __builtin_shufflevector(__s0_255, __s0_255, 7, 6, 5, 4, 3, 2, 1, 0); \ 44449 float16x8_t __rev1_255; __rev1_255 = __builtin_shufflevector(__s1_255, __s1_255, 7, 6, 5, 4, 3, 2, 1, 0); \ 44450 float16x8_t __rev2_255; __rev2_255 = __builtin_shufflevector(__s2_255, __s2_255, 7, 6, 5, 4, 3, 2, 1, 0); \ 44451 __ret_255 = __noswap_vfmaq_laneq_f16(__rev0_255, -__rev1_255, __rev2_255, __p3_255); \ 44452 __ret_255 = __builtin_shufflevector(__ret_255, __ret_255, 7, 6, 5, 4, 3, 2, 1, 0); \ 44453 __ret_255; \ 44454 }) 44455 #endif 44456 44457 #ifdef __LITTLE_ENDIAN__ 44458 #define vfms_laneq_f16(__p0_256, __p1_256, __p2_256, __p3_256) __extension__ ({ \ 44459 float16x4_t __ret_256; \ 44460 float16x4_t __s0_256 = __p0_256; \ 44461 float16x4_t __s1_256 = __p1_256; \ 44462 float16x8_t __s2_256 = __p2_256; \ 44463 __ret_256 = vfma_laneq_f16(__s0_256, -__s1_256, __s2_256, __p3_256); \ 44464 __ret_256; \ 44465 }) 44466 #else 44467 #define vfms_laneq_f16(__p0_257, __p1_257, __p2_257, __p3_257) __extension__ ({ \ 44468 float16x4_t __ret_257; \ 44469 float16x4_t __s0_257 = __p0_257; \ 44470 float16x4_t __s1_257 = __p1_257; \ 44471 float16x8_t __s2_257 = __p2_257; \ 44472 float16x4_t __rev0_257; __rev0_257 = __builtin_shufflevector(__s0_257, __s0_257, 3, 2, 1, 0); \ 44473 float16x4_t __rev1_257; __rev1_257 = __builtin_shufflevector(__s1_257, __s1_257, 3, 2, 1, 0); \ 44474 float16x8_t __rev2_257; __rev2_257 = __builtin_shufflevector(__s2_257, __s2_257, 7, 6, 5, 4, 3, 2, 1, 0); \ 44475 __ret_257 = __noswap_vfma_laneq_f16(__rev0_257, -__rev1_257, __rev2_257, __p3_257); \ 44476 __ret_257 = __builtin_shufflevector(__ret_257, __ret_257, 3, 2, 1, 0); \ 44477 
__ret_257; \ 44478 }) 44479 #endif 44480 44481 #ifdef __LITTLE_ENDIAN__ 44482 #define vfmsq_n_f16(__p0, __p1, __p2) __extension__ ({ \ 44483 float16x8_t __ret; \ 44484 float16x8_t __s0 = __p0; \ 44485 float16x8_t __s1 = __p1; \ 44486 float16_t __s2 = __p2; \ 44487 __ret = vfmaq_f16(__s0, -__s1, (float16x8_t) {__s2, __s2, __s2, __s2, __s2, __s2, __s2, __s2}); \ 44488 __ret; \ 44489 }) 44490 #else 44491 #define vfmsq_n_f16(__p0, __p1, __p2) __extension__ ({ \ 44492 float16x8_t __ret; \ 44493 float16x8_t __s0 = __p0; \ 44494 float16x8_t __s1 = __p1; \ 44495 float16_t __s2 = __p2; \ 44496 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44497 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 44498 __ret = __noswap_vfmaq_f16(__rev0, -__rev1, (float16x8_t) {__s2, __s2, __s2, __s2, __s2, __s2, __s2, __s2}); \ 44499 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 44500 __ret; \ 44501 }) 44502 #endif 44503 44504 #ifdef __LITTLE_ENDIAN__ 44505 #define vfms_n_f16(__p0, __p1, __p2) __extension__ ({ \ 44506 float16x4_t __ret; \ 44507 float16x4_t __s0 = __p0; \ 44508 float16x4_t __s1 = __p1; \ 44509 float16_t __s2 = __p2; \ 44510 __ret = vfma_f16(__s0, -__s1, (float16x4_t) {__s2, __s2, __s2, __s2}); \ 44511 __ret; \ 44512 }) 44513 #else 44514 #define vfms_n_f16(__p0, __p1, __p2) __extension__ ({ \ 44515 float16x4_t __ret; \ 44516 float16x4_t __s0 = __p0; \ 44517 float16x4_t __s1 = __p1; \ 44518 float16_t __s2 = __p2; \ 44519 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44520 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 44521 __ret = __noswap_vfma_f16(__rev0, -__rev1, (float16x4_t) {__s2, __s2, __s2, __s2}); \ 44522 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 44523 __ret; \ 44524 }) 44525 #endif 44526 44527 #ifdef __LITTLE_ENDIAN__ 44528 #define vmaxnmvq_f16(__p0) __extension__ ({ \ 
44529 float16_t __ret; \ 44530 float16x8_t __s0 = __p0; \ 44531 __ret = (float16_t) __builtin_neon_vmaxnmvq_f16((int8x16_t)__s0); \ 44532 __ret; \ 44533 }) 44534 #else 44535 #define vmaxnmvq_f16(__p0) __extension__ ({ \ 44536 float16_t __ret; \ 44537 float16x8_t __s0 = __p0; \ 44538 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44539 __ret = (float16_t) __builtin_neon_vmaxnmvq_f16((int8x16_t)__rev0); \ 44540 __ret; \ 44541 }) 44542 #endif 44543 44544 #ifdef __LITTLE_ENDIAN__ 44545 #define vmaxnmv_f16(__p0) __extension__ ({ \ 44546 float16_t __ret; \ 44547 float16x4_t __s0 = __p0; \ 44548 __ret = (float16_t) __builtin_neon_vmaxnmv_f16((int8x8_t)__s0); \ 44549 __ret; \ 44550 }) 44551 #else 44552 #define vmaxnmv_f16(__p0) __extension__ ({ \ 44553 float16_t __ret; \ 44554 float16x4_t __s0 = __p0; \ 44555 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44556 __ret = (float16_t) __builtin_neon_vmaxnmv_f16((int8x8_t)__rev0); \ 44557 __ret; \ 44558 }) 44559 #endif 44560 44561 #ifdef __LITTLE_ENDIAN__ 44562 #define vmaxvq_f16(__p0) __extension__ ({ \ 44563 float16_t __ret; \ 44564 float16x8_t __s0 = __p0; \ 44565 __ret = (float16_t) __builtin_neon_vmaxvq_f16((int8x16_t)__s0); \ 44566 __ret; \ 44567 }) 44568 #else 44569 #define vmaxvq_f16(__p0) __extension__ ({ \ 44570 float16_t __ret; \ 44571 float16x8_t __s0 = __p0; \ 44572 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44573 __ret = (float16_t) __builtin_neon_vmaxvq_f16((int8x16_t)__rev0); \ 44574 __ret; \ 44575 }) 44576 #endif 44577 44578 #ifdef __LITTLE_ENDIAN__ 44579 #define vmaxv_f16(__p0) __extension__ ({ \ 44580 float16_t __ret; \ 44581 float16x4_t __s0 = __p0; \ 44582 __ret = (float16_t) __builtin_neon_vmaxv_f16((int8x8_t)__s0); \ 44583 __ret; \ 44584 }) 44585 #else 44586 #define vmaxv_f16(__p0) __extension__ ({ \ 44587 float16_t __ret; \ 44588 float16x4_t __s0 = __p0; \ 44589 float16x4_t 
__rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44590 __ret = (float16_t) __builtin_neon_vmaxv_f16((int8x8_t)__rev0); \ 44591 __ret; \ 44592 }) 44593 #endif 44594 44595 #ifdef __LITTLE_ENDIAN__ 44596 #define vminnmvq_f16(__p0) __extension__ ({ \ 44597 float16_t __ret; \ 44598 float16x8_t __s0 = __p0; \ 44599 __ret = (float16_t) __builtin_neon_vminnmvq_f16((int8x16_t)__s0); \ 44600 __ret; \ 44601 }) 44602 #else 44603 #define vminnmvq_f16(__p0) __extension__ ({ \ 44604 float16_t __ret; \ 44605 float16x8_t __s0 = __p0; \ 44606 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44607 __ret = (float16_t) __builtin_neon_vminnmvq_f16((int8x16_t)__rev0); \ 44608 __ret; \ 44609 }) 44610 #endif 44611 44612 #ifdef __LITTLE_ENDIAN__ 44613 #define vminnmv_f16(__p0) __extension__ ({ \ 44614 float16_t __ret; \ 44615 float16x4_t __s0 = __p0; \ 44616 __ret = (float16_t) __builtin_neon_vminnmv_f16((int8x8_t)__s0); \ 44617 __ret; \ 44618 }) 44619 #else 44620 #define vminnmv_f16(__p0) __extension__ ({ \ 44621 float16_t __ret; \ 44622 float16x4_t __s0 = __p0; \ 44623 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44624 __ret = (float16_t) __builtin_neon_vminnmv_f16((int8x8_t)__rev0); \ 44625 __ret; \ 44626 }) 44627 #endif 44628 44629 #ifdef __LITTLE_ENDIAN__ 44630 #define vminvq_f16(__p0) __extension__ ({ \ 44631 float16_t __ret; \ 44632 float16x8_t __s0 = __p0; \ 44633 __ret = (float16_t) __builtin_neon_vminvq_f16((int8x16_t)__s0); \ 44634 __ret; \ 44635 }) 44636 #else 44637 #define vminvq_f16(__p0) __extension__ ({ \ 44638 float16_t __ret; \ 44639 float16x8_t __s0 = __p0; \ 44640 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44641 __ret = (float16_t) __builtin_neon_vminvq_f16((int8x16_t)__rev0); \ 44642 __ret; \ 44643 }) 44644 #endif 44645 44646 #ifdef __LITTLE_ENDIAN__ 44647 #define vminv_f16(__p0) __extension__ ({ \ 44648 float16_t __ret; \ 
44649 float16x4_t __s0 = __p0; \ 44650 __ret = (float16_t) __builtin_neon_vminv_f16((int8x8_t)__s0); \ 44651 __ret; \ 44652 }) 44653 #else 44654 #define vminv_f16(__p0) __extension__ ({ \ 44655 float16_t __ret; \ 44656 float16x4_t __s0 = __p0; \ 44657 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44658 __ret = (float16_t) __builtin_neon_vminv_f16((int8x8_t)__rev0); \ 44659 __ret; \ 44660 }) 44661 #endif 44662 44663 #ifdef __LITTLE_ENDIAN__ 44664 #define vmulq_laneq_f16(__p0_258, __p1_258, __p2_258) __extension__ ({ \ 44665 float16x8_t __ret_258; \ 44666 float16x8_t __s0_258 = __p0_258; \ 44667 float16x8_t __s1_258 = __p1_258; \ 44668 __ret_258 = __s0_258 * splatq_laneq_f16(__s1_258, __p2_258); \ 44669 __ret_258; \ 44670 }) 44671 #else 44672 #define vmulq_laneq_f16(__p0_259, __p1_259, __p2_259) __extension__ ({ \ 44673 float16x8_t __ret_259; \ 44674 float16x8_t __s0_259 = __p0_259; \ 44675 float16x8_t __s1_259 = __p1_259; \ 44676 float16x8_t __rev0_259; __rev0_259 = __builtin_shufflevector(__s0_259, __s0_259, 7, 6, 5, 4, 3, 2, 1, 0); \ 44677 float16x8_t __rev1_259; __rev1_259 = __builtin_shufflevector(__s1_259, __s1_259, 7, 6, 5, 4, 3, 2, 1, 0); \ 44678 __ret_259 = __rev0_259 * __noswap_splatq_laneq_f16(__rev1_259, __p2_259); \ 44679 __ret_259 = __builtin_shufflevector(__ret_259, __ret_259, 7, 6, 5, 4, 3, 2, 1, 0); \ 44680 __ret_259; \ 44681 }) 44682 #endif 44683 44684 #ifdef __LITTLE_ENDIAN__ 44685 #define vmul_laneq_f16(__p0_260, __p1_260, __p2_260) __extension__ ({ \ 44686 float16x4_t __ret_260; \ 44687 float16x4_t __s0_260 = __p0_260; \ 44688 float16x8_t __s1_260 = __p1_260; \ 44689 __ret_260 = __s0_260 * splat_laneq_f16(__s1_260, __p2_260); \ 44690 __ret_260; \ 44691 }) 44692 #else 44693 #define vmul_laneq_f16(__p0_261, __p1_261, __p2_261) __extension__ ({ \ 44694 float16x4_t __ret_261; \ 44695 float16x4_t __s0_261 = __p0_261; \ 44696 float16x8_t __s1_261 = __p1_261; \ 44697 float16x4_t __rev0_261; __rev0_261 = 
__builtin_shufflevector(__s0_261, __s0_261, 3, 2, 1, 0); \ 44698 float16x8_t __rev1_261; __rev1_261 = __builtin_shufflevector(__s1_261, __s1_261, 7, 6, 5, 4, 3, 2, 1, 0); \ 44699 __ret_261 = __rev0_261 * __noswap_splat_laneq_f16(__rev1_261, __p2_261); \ 44700 __ret_261 = __builtin_shufflevector(__ret_261, __ret_261, 3, 2, 1, 0); \ 44701 __ret_261; \ 44702 }) 44703 #endif 44704 44705 #ifdef __LITTLE_ENDIAN__ 44706 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmulxq_f16(float16x8_t __p0, float16x8_t __p1) { 44707 float16x8_t __ret; 44708 __ret = (float16x8_t) __builtin_neon_vmulxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 44709 return __ret; 44710 } 44711 #else 44712 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vmulxq_f16(float16x8_t __p0, float16x8_t __p1) { 44713 float16x8_t __ret; 44714 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 44715 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 44716 __ret = (float16x8_t) __builtin_neon_vmulxq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 44717 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 44718 return __ret; 44719 } 44720 __ai __attribute__((target("fullfp16,neon"))) float16x8_t __noswap_vmulxq_f16(float16x8_t __p0, float16x8_t __p1) { 44721 float16x8_t __ret; 44722 __ret = (float16x8_t) __builtin_neon_vmulxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 44723 return __ret; 44724 } 44725 #endif 44726 44727 #ifdef __LITTLE_ENDIAN__ 44728 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmulx_f16(float16x4_t __p0, float16x4_t __p1) { 44729 float16x4_t __ret; 44730 __ret = (float16x4_t) __builtin_neon_vmulx_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 44731 return __ret; 44732 } 44733 #else 44734 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vmulx_f16(float16x4_t __p0, float16x4_t __p1) { 44735 float16x4_t __ret; 44736 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, 
__p0, 3, 2, 1, 0); 44737 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 44738 __ret = (float16x4_t) __builtin_neon_vmulx_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 44739 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 44740 return __ret; 44741 } 44742 __ai __attribute__((target("fullfp16,neon"))) float16x4_t __noswap_vmulx_f16(float16x4_t __p0, float16x4_t __p1) { 44743 float16x4_t __ret; 44744 __ret = (float16x4_t) __builtin_neon_vmulx_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 44745 return __ret; 44746 } 44747 #endif 44748 44749 #ifdef __LITTLE_ENDIAN__ 44750 #define vmulxh_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 44751 float16_t __ret; \ 44752 float16_t __s0 = __p0; \ 44753 float16x4_t __s1 = __p1; \ 44754 __ret = (float16_t) __builtin_neon_vmulxh_lane_f16(__s0, (float16x4_t)__s1, __p2); \ 44755 __ret; \ 44756 }) 44757 #else 44758 #define vmulxh_lane_f16(__p0, __p1, __p2) __extension__ ({ \ 44759 float16_t __ret; \ 44760 float16_t __s0 = __p0; \ 44761 float16x4_t __s1 = __p1; \ 44762 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 44763 __ret = (float16_t) __builtin_neon_vmulxh_lane_f16(__s0, (float16x4_t)__rev1, __p2); \ 44764 __ret; \ 44765 }) 44766 #endif 44767 44768 #ifdef __LITTLE_ENDIAN__ 44769 #define vmulxq_lane_f16(__p0_262, __p1_262, __p2_262) __extension__ ({ \ 44770 float16x8_t __ret_262; \ 44771 float16x8_t __s0_262 = __p0_262; \ 44772 float16x4_t __s1_262 = __p1_262; \ 44773 __ret_262 = vmulxq_f16(__s0_262, splatq_lane_f16(__s1_262, __p2_262)); \ 44774 __ret_262; \ 44775 }) 44776 #else 44777 #define vmulxq_lane_f16(__p0_263, __p1_263, __p2_263) __extension__ ({ \ 44778 float16x8_t __ret_263; \ 44779 float16x8_t __s0_263 = __p0_263; \ 44780 float16x4_t __s1_263 = __p1_263; \ 44781 float16x8_t __rev0_263; __rev0_263 = __builtin_shufflevector(__s0_263, __s0_263, 7, 6, 5, 4, 3, 2, 1, 0); \ 44782 float16x4_t __rev1_263; __rev1_263 = __builtin_shufflevector(__s1_263, __s1_263, 
3, 2, 1, 0); \ 44783 __ret_263 = __noswap_vmulxq_f16(__rev0_263, __noswap_splatq_lane_f16(__rev1_263, __p2_263)); \ 44784 __ret_263 = __builtin_shufflevector(__ret_263, __ret_263, 7, 6, 5, 4, 3, 2, 1, 0); \ 44785 __ret_263; \ 44786 }) 44787 #endif 44788 44789 #ifdef __LITTLE_ENDIAN__ 44790 #define vmulx_lane_f16(__p0_264, __p1_264, __p2_264) __extension__ ({ \ 44791 float16x4_t __ret_264; \ 44792 float16x4_t __s0_264 = __p0_264; \ 44793 float16x4_t __s1_264 = __p1_264; \ 44794 __ret_264 = vmulx_f16(__s0_264, splat_lane_f16(__s1_264, __p2_264)); \ 44795 __ret_264; \ 44796 }) 44797 #else 44798 #define vmulx_lane_f16(__p0_265, __p1_265, __p2_265) __extension__ ({ \ 44799 float16x4_t __ret_265; \ 44800 float16x4_t __s0_265 = __p0_265; \ 44801 float16x4_t __s1_265 = __p1_265; \ 44802 float16x4_t __rev0_265; __rev0_265 = __builtin_shufflevector(__s0_265, __s0_265, 3, 2, 1, 0); \ 44803 float16x4_t __rev1_265; __rev1_265 = __builtin_shufflevector(__s1_265, __s1_265, 3, 2, 1, 0); \ 44804 __ret_265 = __noswap_vmulx_f16(__rev0_265, __noswap_splat_lane_f16(__rev1_265, __p2_265)); \ 44805 __ret_265 = __builtin_shufflevector(__ret_265, __ret_265, 3, 2, 1, 0); \ 44806 __ret_265; \ 44807 }) 44808 #endif 44809 44810 #ifdef __LITTLE_ENDIAN__ 44811 #define vmulxh_laneq_f16(__p0, __p1, __p2) __extension__ ({ \ 44812 float16_t __ret; \ 44813 float16_t __s0 = __p0; \ 44814 float16x8_t __s1 = __p1; \ 44815 __ret = (float16_t) __builtin_neon_vmulxh_laneq_f16(__s0, (float16x8_t)__s1, __p2); \ 44816 __ret; \ 44817 }) 44818 #else 44819 #define vmulxh_laneq_f16(__p0, __p1, __p2) __extension__ ({ \ 44820 float16_t __ret; \ 44821 float16_t __s0 = __p0; \ 44822 float16x8_t __s1 = __p1; \ 44823 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 44824 __ret = (float16_t) __builtin_neon_vmulxh_laneq_f16(__s0, (float16x8_t)__rev1, __p2); \ 44825 __ret; \ 44826 }) 44827 #endif 44828 44829 #ifdef __LITTLE_ENDIAN__ 44830 #define vmulxq_laneq_f16(__p0_266, 
__p1_266, __p2_266) __extension__ ({ \ 44831 float16x8_t __ret_266; \ 44832 float16x8_t __s0_266 = __p0_266; \ 44833 float16x8_t __s1_266 = __p1_266; \ 44834 __ret_266 = vmulxq_f16(__s0_266, splatq_laneq_f16(__s1_266, __p2_266)); \ 44835 __ret_266; \ 44836 }) 44837 #else 44838 #define vmulxq_laneq_f16(__p0_267, __p1_267, __p2_267) __extension__ ({ \ 44839 float16x8_t __ret_267; \ 44840 float16x8_t __s0_267 = __p0_267; \ 44841 float16x8_t __s1_267 = __p1_267; \ 44842 float16x8_t __rev0_267; __rev0_267 = __builtin_shufflevector(__s0_267, __s0_267, 7, 6, 5, 4, 3, 2, 1, 0); \ 44843 float16x8_t __rev1_267; __rev1_267 = __builtin_shufflevector(__s1_267, __s1_267, 7, 6, 5, 4, 3, 2, 1, 0); \ 44844 __ret_267 = __noswap_vmulxq_f16(__rev0_267, __noswap_splatq_laneq_f16(__rev1_267, __p2_267)); \ 44845 __ret_267 = __builtin_shufflevector(__ret_267, __ret_267, 7, 6, 5, 4, 3, 2, 1, 0); \ 44846 __ret_267; \ 44847 }) 44848 #endif 44849 44850 #ifdef __LITTLE_ENDIAN__ 44851 #define vmulx_laneq_f16(__p0_268, __p1_268, __p2_268) __extension__ ({ \ 44852 float16x4_t __ret_268; \ 44853 float16x4_t __s0_268 = __p0_268; \ 44854 float16x8_t __s1_268 = __p1_268; \ 44855 __ret_268 = vmulx_f16(__s0_268, splat_laneq_f16(__s1_268, __p2_268)); \ 44856 __ret_268; \ 44857 }) 44858 #else 44859 #define vmulx_laneq_f16(__p0_269, __p1_269, __p2_269) __extension__ ({ \ 44860 float16x4_t __ret_269; \ 44861 float16x4_t __s0_269 = __p0_269; \ 44862 float16x8_t __s1_269 = __p1_269; \ 44863 float16x4_t __rev0_269; __rev0_269 = __builtin_shufflevector(__s0_269, __s0_269, 3, 2, 1, 0); \ 44864 float16x8_t __rev1_269; __rev1_269 = __builtin_shufflevector(__s1_269, __s1_269, 7, 6, 5, 4, 3, 2, 1, 0); \ 44865 __ret_269 = __noswap_vmulx_f16(__rev0_269, __noswap_splat_laneq_f16(__rev1_269, __p2_269)); \ 44866 __ret_269 = __builtin_shufflevector(__ret_269, __ret_269, 3, 2, 1, 0); \ 44867 __ret_269; \ 44868 }) 44869 #endif 44870 44871 #ifdef __LITTLE_ENDIAN__ 44872 #define vmulxq_n_f16(__p0, __p1) __extension__ ({ \ 
44873 float16x8_t __ret; \ 44874 float16x8_t __s0 = __p0; \ 44875 float16_t __s1 = __p1; \ 44876 __ret = vmulxq_f16(__s0, (float16x8_t) {__s1, __s1, __s1, __s1, __s1, __s1, __s1, __s1}); \ 44877 __ret; \ 44878 }) 44879 #else 44880 #define vmulxq_n_f16(__p0, __p1) __extension__ ({ \ 44881 float16x8_t __ret; \ 44882 float16x8_t __s0 = __p0; \ 44883 float16_t __s1 = __p1; \ 44884 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 44885 __ret = __noswap_vmulxq_f16(__rev0, (float16x8_t) {__s1, __s1, __s1, __s1, __s1, __s1, __s1, __s1}); \ 44886 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 44887 __ret; \ 44888 }) 44889 #endif 44890 44891 #ifdef __LITTLE_ENDIAN__ 44892 #define vmulx_n_f16(__p0, __p1) __extension__ ({ \ 44893 float16x4_t __ret; \ 44894 float16x4_t __s0 = __p0; \ 44895 float16_t __s1 = __p1; \ 44896 __ret = vmulx_f16(__s0, (float16x4_t) {__s1, __s1, __s1, __s1}); \ 44897 __ret; \ 44898 }) 44899 #else 44900 #define vmulx_n_f16(__p0, __p1) __extension__ ({ \ 44901 float16x4_t __ret; \ 44902 float16x4_t __s0 = __p0; \ 44903 float16_t __s1 = __p1; \ 44904 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 44905 __ret = __noswap_vmulx_f16(__rev0, (float16x4_t) {__s1, __s1, __s1, __s1}); \ 44906 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 44907 __ret; \ 44908 }) 44909 #endif 44910 44911 #ifdef __LITTLE_ENDIAN__ 44912 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpaddq_f16(float16x8_t __p0, float16x8_t __p1) { 44913 float16x8_t __ret; 44914 __ret = (float16x8_t) __builtin_neon_vpaddq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 44915 return __ret; 44916 } 44917 #else 44918 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpaddq_f16(float16x8_t __p0, float16x8_t __p1) { 44919 float16x8_t __ret; 44920 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 44921 float16x8_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 44922 __ret = (float16x8_t) __builtin_neon_vpaddq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 44923 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 44924 return __ret; 44925 } 44926 #endif 44927 44928 #ifdef __LITTLE_ENDIAN__ 44929 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpmaxq_f16(float16x8_t __p0, float16x8_t __p1) { 44930 float16x8_t __ret; 44931 __ret = (float16x8_t) __builtin_neon_vpmaxq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 44932 return __ret; 44933 } 44934 #else 44935 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpmaxq_f16(float16x8_t __p0, float16x8_t __p1) { 44936 float16x8_t __ret; 44937 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 44938 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 44939 __ret = (float16x8_t) __builtin_neon_vpmaxq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 44940 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 44941 return __ret; 44942 } 44943 #endif 44944 44945 #ifdef __LITTLE_ENDIAN__ 44946 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpmaxnmq_f16(float16x8_t __p0, float16x8_t __p1) { 44947 float16x8_t __ret; 44948 __ret = (float16x8_t) __builtin_neon_vpmaxnmq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 44949 return __ret; 44950 } 44951 #else 44952 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpmaxnmq_f16(float16x8_t __p0, float16x8_t __p1) { 44953 float16x8_t __ret; 44954 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 44955 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 44956 __ret = (float16x8_t) __builtin_neon_vpmaxnmq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 44957 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 44958 return __ret; 44959 } 44960 #endif 44961 
44962 #ifdef __LITTLE_ENDIAN__ 44963 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmaxnm_f16(float16x4_t __p0, float16x4_t __p1) { 44964 float16x4_t __ret; 44965 __ret = (float16x4_t) __builtin_neon_vpmaxnm_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 44966 return __ret; 44967 } 44968 #else 44969 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpmaxnm_f16(float16x4_t __p0, float16x4_t __p1) { 44970 float16x4_t __ret; 44971 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 44972 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 44973 __ret = (float16x4_t) __builtin_neon_vpmaxnm_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 44974 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 44975 return __ret; 44976 } 44977 #endif 44978 44979 #ifdef __LITTLE_ENDIAN__ 44980 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpminq_f16(float16x8_t __p0, float16x8_t __p1) { 44981 float16x8_t __ret; 44982 __ret = (float16x8_t) __builtin_neon_vpminq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 44983 return __ret; 44984 } 44985 #else 44986 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpminq_f16(float16x8_t __p0, float16x8_t __p1) { 44987 float16x8_t __ret; 44988 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 44989 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 44990 __ret = (float16x8_t) __builtin_neon_vpminq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 44991 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 44992 return __ret; 44993 } 44994 #endif 44995 44996 #ifdef __LITTLE_ENDIAN__ 44997 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vpminnmq_f16(float16x8_t __p0, float16x8_t __p1) { 44998 float16x8_t __ret; 44999 __ret = (float16x8_t) __builtin_neon_vpminnmq_f16((int8x16_t)__p0, (int8x16_t)__p1, 40); 45000 return __ret; 45001 } 45002 #else 45003 __ai 
__attribute__((target("fullfp16,neon"))) float16x8_t vpminnmq_f16(float16x8_t __p0, float16x8_t __p1) { 45004 float16x8_t __ret; 45005 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45006 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 45007 __ret = (float16x8_t) __builtin_neon_vpminnmq_f16((int8x16_t)__rev0, (int8x16_t)__rev1, 40); 45008 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 45009 return __ret; 45010 } 45011 #endif 45012 45013 #ifdef __LITTLE_ENDIAN__ 45014 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpminnm_f16(float16x4_t __p0, float16x4_t __p1) { 45015 float16x4_t __ret; 45016 __ret = (float16x4_t) __builtin_neon_vpminnm_f16((int8x8_t)__p0, (int8x8_t)__p1, 8); 45017 return __ret; 45018 } 45019 #else 45020 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vpminnm_f16(float16x4_t __p0, float16x4_t __p1) { 45021 float16x4_t __ret; 45022 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45023 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 45024 __ret = (float16x4_t) __builtin_neon_vpminnm_f16((int8x8_t)__rev0, (int8x8_t)__rev1, 8); 45025 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 45026 return __ret; 45027 } 45028 #endif 45029 45030 #ifdef __LITTLE_ENDIAN__ 45031 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndiq_f16(float16x8_t __p0) { 45032 float16x8_t __ret; 45033 __ret = (float16x8_t) __builtin_neon_vrndiq_f16((int8x16_t)__p0, 40); 45034 return __ret; 45035 } 45036 #else 45037 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vrndiq_f16(float16x8_t __p0) { 45038 float16x8_t __ret; 45039 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45040 __ret = (float16x8_t) __builtin_neon_vrndiq_f16((int8x16_t)__rev0, 40); 45041 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 
45042 return __ret; 45043 } 45044 #endif 45045 45046 #ifdef __LITTLE_ENDIAN__ 45047 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndi_f16(float16x4_t __p0) { 45048 float16x4_t __ret; 45049 __ret = (float16x4_t) __builtin_neon_vrndi_f16((int8x8_t)__p0, 8); 45050 return __ret; 45051 } 45052 #else 45053 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vrndi_f16(float16x4_t __p0) { 45054 float16x4_t __ret; 45055 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45056 __ret = (float16x4_t) __builtin_neon_vrndi_f16((int8x8_t)__rev0, 8); 45057 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 45058 return __ret; 45059 } 45060 #endif 45061 45062 #ifdef __LITTLE_ENDIAN__ 45063 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vsqrtq_f16(float16x8_t __p0) { 45064 float16x8_t __ret; 45065 __ret = (float16x8_t) __builtin_neon_vsqrtq_f16((int8x16_t)__p0, 40); 45066 return __ret; 45067 } 45068 #else 45069 __ai __attribute__((target("fullfp16,neon"))) float16x8_t vsqrtq_f16(float16x8_t __p0) { 45070 float16x8_t __ret; 45071 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45072 __ret = (float16x8_t) __builtin_neon_vsqrtq_f16((int8x16_t)__rev0, 40); 45073 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 45074 return __ret; 45075 } 45076 #endif 45077 45078 #ifdef __LITTLE_ENDIAN__ 45079 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vsqrt_f16(float16x4_t __p0) { 45080 float16x4_t __ret; 45081 __ret = (float16x4_t) __builtin_neon_vsqrt_f16((int8x8_t)__p0, 8); 45082 return __ret; 45083 } 45084 #else 45085 __ai __attribute__((target("fullfp16,neon"))) float16x4_t vsqrt_f16(float16x4_t __p0) { 45086 float16x4_t __ret; 45087 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45088 __ret = (float16x4_t) __builtin_neon_vsqrt_f16((int8x8_t)__rev0, 8); 45089 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 45090 
return __ret; 45091 } 45092 #endif 45093 45094 #ifdef __LITTLE_ENDIAN__ 45095 #define vsudotq_laneq_s32(__p0_270, __p1_270, __p2_270, __p3_270) __extension__ ({ \ 45096 int32x4_t __ret_270; \ 45097 int32x4_t __s0_270 = __p0_270; \ 45098 int8x16_t __s1_270 = __p1_270; \ 45099 uint8x16_t __s2_270 = __p2_270; \ 45100 __ret_270 = vusdotq_s32(__s0_270, (uint8x16_t)(splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_270), __p3_270)), __s1_270); \ 45101 __ret_270; \ 45102 }) 45103 #else 45104 #define vsudotq_laneq_s32(__p0_271, __p1_271, __p2_271, __p3_271) __extension__ ({ \ 45105 int32x4_t __ret_271; \ 45106 int32x4_t __s0_271 = __p0_271; \ 45107 int8x16_t __s1_271 = __p1_271; \ 45108 uint8x16_t __s2_271 = __p2_271; \ 45109 int32x4_t __rev0_271; __rev0_271 = __builtin_shufflevector(__s0_271, __s0_271, 3, 2, 1, 0); \ 45110 int8x16_t __rev1_271; __rev1_271 = __builtin_shufflevector(__s1_271, __s1_271, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 45111 uint8x16_t __rev2_271; __rev2_271 = __builtin_shufflevector(__s2_271, __s2_271, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 45112 __ret_271 = __noswap_vusdotq_s32(__rev0_271, (uint8x16_t)(__noswap_splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_271), __p3_271)), __rev1_271); \ 45113 __ret_271 = __builtin_shufflevector(__ret_271, __ret_271, 3, 2, 1, 0); \ 45114 __ret_271; \ 45115 }) 45116 #endif 45117 45118 #ifdef __LITTLE_ENDIAN__ 45119 #define vsudot_laneq_s32(__p0_272, __p1_272, __p2_272, __p3_272) __extension__ ({ \ 45120 int32x2_t __ret_272; \ 45121 int32x2_t __s0_272 = __p0_272; \ 45122 int8x8_t __s1_272 = __p1_272; \ 45123 uint8x16_t __s2_272 = __p2_272; \ 45124 __ret_272 = vusdot_s32(__s0_272, (uint8x8_t)(splat_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_272), __p3_272)), __s1_272); \ 45125 __ret_272; \ 45126 }) 45127 #else 45128 #define vsudot_laneq_s32(__p0_273, __p1_273, __p2_273, __p3_273) __extension__ ({ \ 45129 int32x2_t __ret_273; \ 45130 int32x2_t __s0_273 = __p0_273; \ 45131 
int8x8_t __s1_273 = __p1_273; \ 45132 uint8x16_t __s2_273 = __p2_273; \ 45133 int32x2_t __rev0_273; __rev0_273 = __builtin_shufflevector(__s0_273, __s0_273, 1, 0); \ 45134 int8x8_t __rev1_273; __rev1_273 = __builtin_shufflevector(__s1_273, __s1_273, 7, 6, 5, 4, 3, 2, 1, 0); \ 45135 uint8x16_t __rev2_273; __rev2_273 = __builtin_shufflevector(__s2_273, __s2_273, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 45136 __ret_273 = __noswap_vusdot_s32(__rev0_273, (uint8x8_t)(__noswap_splat_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_273), __p3_273)), __rev1_273); \ 45137 __ret_273 = __builtin_shufflevector(__ret_273, __ret_273, 1, 0); \ 45138 __ret_273; \ 45139 }) 45140 #endif 45141 45142 #ifdef __LITTLE_ENDIAN__ 45143 #define vusdotq_laneq_s32(__p0_274, __p1_274, __p2_274, __p3_274) __extension__ ({ \ 45144 int32x4_t __ret_274; \ 45145 int32x4_t __s0_274 = __p0_274; \ 45146 uint8x16_t __s1_274 = __p1_274; \ 45147 int8x16_t __s2_274 = __p2_274; \ 45148 __ret_274 = vusdotq_s32(__s0_274, __s1_274, (int8x16_t)(splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_274), __p3_274))); \ 45149 __ret_274; \ 45150 }) 45151 #else 45152 #define vusdotq_laneq_s32(__p0_275, __p1_275, __p2_275, __p3_275) __extension__ ({ \ 45153 int32x4_t __ret_275; \ 45154 int32x4_t __s0_275 = __p0_275; \ 45155 uint8x16_t __s1_275 = __p1_275; \ 45156 int8x16_t __s2_275 = __p2_275; \ 45157 int32x4_t __rev0_275; __rev0_275 = __builtin_shufflevector(__s0_275, __s0_275, 3, 2, 1, 0); \ 45158 uint8x16_t __rev1_275; __rev1_275 = __builtin_shufflevector(__s1_275, __s1_275, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 45159 int8x16_t __rev2_275; __rev2_275 = __builtin_shufflevector(__s2_275, __s2_275, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 45160 __ret_275 = __noswap_vusdotq_s32(__rev0_275, __rev1_275, (int8x16_t)(__noswap_splatq_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_275), __p3_275))); \ 45161 __ret_275 = __builtin_shufflevector(__ret_275, __ret_275, 3, 2, 1, 0); 
\ 45162 __ret_275; \ 45163 }) 45164 #endif 45165 45166 #ifdef __LITTLE_ENDIAN__ 45167 #define vusdot_laneq_s32(__p0_276, __p1_276, __p2_276, __p3_276) __extension__ ({ \ 45168 int32x2_t __ret_276; \ 45169 int32x2_t __s0_276 = __p0_276; \ 45170 uint8x8_t __s1_276 = __p1_276; \ 45171 int8x16_t __s2_276 = __p2_276; \ 45172 __ret_276 = vusdot_s32(__s0_276, __s1_276, (int8x8_t)(splat_laneq_s32(__builtin_bit_cast(int32x4_t, __s2_276), __p3_276))); \ 45173 __ret_276; \ 45174 }) 45175 #else 45176 #define vusdot_laneq_s32(__p0_277, __p1_277, __p2_277, __p3_277) __extension__ ({ \ 45177 int32x2_t __ret_277; \ 45178 int32x2_t __s0_277 = __p0_277; \ 45179 uint8x8_t __s1_277 = __p1_277; \ 45180 int8x16_t __s2_277 = __p2_277; \ 45181 int32x2_t __rev0_277; __rev0_277 = __builtin_shufflevector(__s0_277, __s0_277, 1, 0); \ 45182 uint8x8_t __rev1_277; __rev1_277 = __builtin_shufflevector(__s1_277, __s1_277, 7, 6, 5, 4, 3, 2, 1, 0); \ 45183 int8x16_t __rev2_277; __rev2_277 = __builtin_shufflevector(__s2_277, __s2_277, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 45184 __ret_277 = __noswap_vusdot_s32(__rev0_277, __rev1_277, (int8x8_t)(__noswap_splat_laneq_s32(__builtin_bit_cast(int32x4_t, __rev2_277), __p3_277))); \ 45185 __ret_277 = __builtin_shufflevector(__ret_277, __ret_277, 1, 0); \ 45186 __ret_277; \ 45187 }) 45188 #endif 45189 45190 #ifdef __LITTLE_ENDIAN__ 45191 __ai __attribute__((target("neon"))) float64x2_t vabdq_f64(float64x2_t __p0, float64x2_t __p1) { 45192 float64x2_t __ret; 45193 __ret = (float64x2_t) __builtin_neon_vabdq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 45194 return __ret; 45195 } 45196 #else 45197 __ai __attribute__((target("neon"))) float64x2_t vabdq_f64(float64x2_t __p0, float64x2_t __p1) { 45198 float64x2_t __ret; 45199 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45200 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45201 __ret = (float64x2_t) __builtin_neon_vabdq_v((int8x16_t)__rev0, 
(int8x16_t)__rev1, 42); 45202 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45203 return __ret; 45204 } 45205 #endif 45206 45207 __ai __attribute__((target("neon"))) float64x1_t vabd_f64(float64x1_t __p0, float64x1_t __p1) { 45208 float64x1_t __ret; 45209 __ret = (float64x1_t) __builtin_neon_vabd_v((int8x8_t)__p0, (int8x8_t)__p1, 10); 45210 return __ret; 45211 } 45212 __ai __attribute__((target("neon"))) float64_t vabdd_f64(float64_t __p0, float64_t __p1) { 45213 float64_t __ret; 45214 __ret = (float64_t) __builtin_neon_vabdd_f64(__p0, __p1); 45215 return __ret; 45216 } 45217 __ai __attribute__((target("neon"))) float32_t vabds_f32(float32_t __p0, float32_t __p1) { 45218 float32_t __ret; 45219 __ret = (float32_t) __builtin_neon_vabds_f32(__p0, __p1); 45220 return __ret; 45221 } 45222 #ifdef __LITTLE_ENDIAN__ 45223 __ai __attribute__((target("neon"))) float64x2_t vabsq_f64(float64x2_t __p0) { 45224 float64x2_t __ret; 45225 __ret = (float64x2_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 42); 45226 return __ret; 45227 } 45228 #else 45229 __ai __attribute__((target("neon"))) float64x2_t vabsq_f64(float64x2_t __p0) { 45230 float64x2_t __ret; 45231 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45232 __ret = (float64x2_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 42); 45233 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45234 return __ret; 45235 } 45236 #endif 45237 45238 #ifdef __LITTLE_ENDIAN__ 45239 __ai __attribute__((target("neon"))) int64x2_t vabsq_s64(int64x2_t __p0) { 45240 int64x2_t __ret; 45241 __ret = (int64x2_t) __builtin_neon_vabsq_v((int8x16_t)__p0, 35); 45242 return __ret; 45243 } 45244 #else 45245 __ai __attribute__((target("neon"))) int64x2_t vabsq_s64(int64x2_t __p0) { 45246 int64x2_t __ret; 45247 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45248 __ret = (int64x2_t) __builtin_neon_vabsq_v((int8x16_t)__rev0, 35); 45249 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45250 return __ret; 
45251 } 45252 #endif 45253 45254 __ai __attribute__((target("neon"))) float64x1_t vabs_f64(float64x1_t __p0) { 45255 float64x1_t __ret; 45256 __ret = (float64x1_t) __builtin_neon_vabs_v((int8x8_t)__p0, 10); 45257 return __ret; 45258 } 45259 __ai __attribute__((target("neon"))) int64x1_t vabs_s64(int64x1_t __p0) { 45260 int64x1_t __ret; 45261 __ret = (int64x1_t) __builtin_neon_vabs_v((int8x8_t)__p0, 3); 45262 return __ret; 45263 } 45264 __ai __attribute__((target("neon"))) int64_t vabsd_s64(int64_t __p0) { 45265 int64_t __ret; 45266 __ret = (int64_t) __builtin_neon_vabsd_s64(__p0); 45267 return __ret; 45268 } 45269 #ifdef __LITTLE_ENDIAN__ 45270 __ai __attribute__((target("neon"))) float64x2_t vaddq_f64(float64x2_t __p0, float64x2_t __p1) { 45271 float64x2_t __ret; 45272 __ret = __p0 + __p1; 45273 return __ret; 45274 } 45275 #else 45276 __ai __attribute__((target("neon"))) float64x2_t vaddq_f64(float64x2_t __p0, float64x2_t __p1) { 45277 float64x2_t __ret; 45278 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45279 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45280 __ret = __rev0 + __rev1; 45281 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45282 return __ret; 45283 } 45284 #endif 45285 45286 __ai __attribute__((target("neon"))) float64x1_t vadd_f64(float64x1_t __p0, float64x1_t __p1) { 45287 float64x1_t __ret; 45288 __ret = __p0 + __p1; 45289 return __ret; 45290 } 45291 __ai __attribute__((target("neon"))) uint64_t vaddd_u64(uint64_t __p0, uint64_t __p1) { 45292 uint64_t __ret; 45293 __ret = (uint64_t) __builtin_neon_vaddd_u64(__p0, __p1); 45294 return __ret; 45295 } 45296 __ai __attribute__((target("neon"))) int64_t vaddd_s64(int64_t __p0, int64_t __p1) { 45297 int64_t __ret; 45298 __ret = (int64_t) __builtin_neon_vaddd_s64(__p0, __p1); 45299 return __ret; 45300 } 45301 __ai __attribute__((target("neon"))) poly128_t vaddq_p128(poly128_t __p0, poly128_t __p1) { 45302 poly128_t __ret; 45303 __ret = 
(poly128_t) __builtin_neon_vaddq_p128(__p0, __p1); 45304 return __ret; 45305 } 45306 #ifdef __LITTLE_ENDIAN__ 45307 __ai __attribute__((target("neon"))) uint16x8_t vaddhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 45308 uint16x8_t __ret; 45309 __ret = vcombine_u16(__p0, vaddhn_u32(__p1, __p2)); 45310 return __ret; 45311 } 45312 #else 45313 __ai __attribute__((target("neon"))) uint16x8_t vaddhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 45314 uint16x8_t __ret; 45315 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45316 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 45317 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 45318 __ret = __noswap_vcombine_u16(__rev0, __noswap_vaddhn_u32(__rev1, __rev2)); 45319 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 45320 return __ret; 45321 } 45322 #endif 45323 45324 #ifdef __LITTLE_ENDIAN__ 45325 __ai __attribute__((target("neon"))) uint32x4_t vaddhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 45326 uint32x4_t __ret; 45327 __ret = vcombine_u32(__p0, vaddhn_u64(__p1, __p2)); 45328 return __ret; 45329 } 45330 #else 45331 __ai __attribute__((target("neon"))) uint32x4_t vaddhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 45332 uint32x4_t __ret; 45333 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45334 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45335 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 45336 __ret = __noswap_vcombine_u32(__rev0, __noswap_vaddhn_u64(__rev1, __rev2)); 45337 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 45338 return __ret; 45339 } 45340 #endif 45341 45342 #ifdef __LITTLE_ENDIAN__ 45343 __ai __attribute__((target("neon"))) uint8x16_t vaddhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 45344 uint8x16_t __ret; 45345 __ret = 
vcombine_u8(__p0, vaddhn_u16(__p1, __p2)); 45346 return __ret; 45347 } 45348 #else 45349 __ai __attribute__((target("neon"))) uint8x16_t vaddhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 45350 uint8x16_t __ret; 45351 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45352 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 45353 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 45354 __ret = __noswap_vcombine_u8(__rev0, __noswap_vaddhn_u16(__rev1, __rev2)); 45355 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 45356 return __ret; 45357 } 45358 #endif 45359 45360 #ifdef __LITTLE_ENDIAN__ 45361 __ai __attribute__((target("neon"))) int16x8_t vaddhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 45362 int16x8_t __ret; 45363 __ret = vcombine_s16(__p0, vaddhn_s32(__p1, __p2)); 45364 return __ret; 45365 } 45366 #else 45367 __ai __attribute__((target("neon"))) int16x8_t vaddhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 45368 int16x8_t __ret; 45369 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45370 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 45371 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 45372 __ret = __noswap_vcombine_s16(__rev0, __noswap_vaddhn_s32(__rev1, __rev2)); 45373 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 45374 return __ret; 45375 } 45376 #endif 45377 45378 #ifdef __LITTLE_ENDIAN__ 45379 __ai __attribute__((target("neon"))) int32x4_t vaddhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 45380 int32x4_t __ret; 45381 __ret = vcombine_s32(__p0, vaddhn_s64(__p1, __p2)); 45382 return __ret; 45383 } 45384 #else 45385 __ai __attribute__((target("neon"))) int32x4_t vaddhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t 
__p2) { 45386 int32x4_t __ret; 45387 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45388 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45389 int64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 45390 __ret = __noswap_vcombine_s32(__rev0, __noswap_vaddhn_s64(__rev1, __rev2)); 45391 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 45392 return __ret; 45393 } 45394 #endif 45395 45396 #ifdef __LITTLE_ENDIAN__ 45397 __ai __attribute__((target("neon"))) int8x16_t vaddhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 45398 int8x16_t __ret; 45399 __ret = vcombine_s8(__p0, vaddhn_s16(__p1, __p2)); 45400 return __ret; 45401 } 45402 #else 45403 __ai __attribute__((target("neon"))) int8x16_t vaddhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 45404 int8x16_t __ret; 45405 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45406 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 45407 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 45408 __ret = __noswap_vcombine_s8(__rev0, __noswap_vaddhn_s16(__rev1, __rev2)); 45409 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 45410 return __ret; 45411 } 45412 #endif 45413 45414 #ifdef __LITTLE_ENDIAN__ 45415 __ai __attribute__((target("neon"))) uint16_t vaddlvq_u8(uint8x16_t __p0) { 45416 uint16_t __ret; 45417 __ret = (uint16_t) __builtin_neon_vaddlvq_u8(__p0); 45418 return __ret; 45419 } 45420 #else 45421 __ai __attribute__((target("neon"))) uint16_t vaddlvq_u8(uint8x16_t __p0) { 45422 uint16_t __ret; 45423 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 45424 __ret = (uint16_t) __builtin_neon_vaddlvq_u8(__rev0); 45425 return __ret; 45426 } 45427 #endif 45428 45429 #ifdef __LITTLE_ENDIAN__ 45430 __ai 
__attribute__((target("neon"))) uint64_t vaddlvq_u32(uint32x4_t __p0) { 45431 uint64_t __ret; 45432 __ret = (uint64_t) __builtin_neon_vaddlvq_u32(__p0); 45433 return __ret; 45434 } 45435 #else 45436 __ai __attribute__((target("neon"))) uint64_t vaddlvq_u32(uint32x4_t __p0) { 45437 uint64_t __ret; 45438 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45439 __ret = (uint64_t) __builtin_neon_vaddlvq_u32(__rev0); 45440 return __ret; 45441 } 45442 #endif 45443 45444 #ifdef __LITTLE_ENDIAN__ 45445 __ai __attribute__((target("neon"))) uint32_t vaddlvq_u16(uint16x8_t __p0) { 45446 uint32_t __ret; 45447 __ret = (uint32_t) __builtin_neon_vaddlvq_u16(__p0); 45448 return __ret; 45449 } 45450 #else 45451 __ai __attribute__((target("neon"))) uint32_t vaddlvq_u16(uint16x8_t __p0) { 45452 uint32_t __ret; 45453 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45454 __ret = (uint32_t) __builtin_neon_vaddlvq_u16(__rev0); 45455 return __ret; 45456 } 45457 #endif 45458 45459 #ifdef __LITTLE_ENDIAN__ 45460 __ai __attribute__((target("neon"))) int16_t vaddlvq_s8(int8x16_t __p0) { 45461 int16_t __ret; 45462 __ret = (int16_t) __builtin_neon_vaddlvq_s8(__p0); 45463 return __ret; 45464 } 45465 #else 45466 __ai __attribute__((target("neon"))) int16_t vaddlvq_s8(int8x16_t __p0) { 45467 int16_t __ret; 45468 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 45469 __ret = (int16_t) __builtin_neon_vaddlvq_s8(__rev0); 45470 return __ret; 45471 } 45472 #endif 45473 45474 #ifdef __LITTLE_ENDIAN__ 45475 __ai __attribute__((target("neon"))) int64_t vaddlvq_s32(int32x4_t __p0) { 45476 int64_t __ret; 45477 __ret = (int64_t) __builtin_neon_vaddlvq_s32(__p0); 45478 return __ret; 45479 } 45480 #else 45481 __ai __attribute__((target("neon"))) int64_t vaddlvq_s32(int32x4_t __p0) { 45482 int64_t __ret; 45483 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 
1, 0); 45484 __ret = (int64_t) __builtin_neon_vaddlvq_s32(__rev0); 45485 return __ret; 45486 } 45487 #endif 45488 45489 #ifdef __LITTLE_ENDIAN__ 45490 __ai __attribute__((target("neon"))) int32_t vaddlvq_s16(int16x8_t __p0) { 45491 int32_t __ret; 45492 __ret = (int32_t) __builtin_neon_vaddlvq_s16(__p0); 45493 return __ret; 45494 } 45495 #else 45496 __ai __attribute__((target("neon"))) int32_t vaddlvq_s16(int16x8_t __p0) { 45497 int32_t __ret; 45498 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45499 __ret = (int32_t) __builtin_neon_vaddlvq_s16(__rev0); 45500 return __ret; 45501 } 45502 #endif 45503 45504 #ifdef __LITTLE_ENDIAN__ 45505 __ai __attribute__((target("neon"))) uint16_t vaddlv_u8(uint8x8_t __p0) { 45506 uint16_t __ret; 45507 __ret = (uint16_t) __builtin_neon_vaddlv_u8(__p0); 45508 return __ret; 45509 } 45510 #else 45511 __ai __attribute__((target("neon"))) uint16_t vaddlv_u8(uint8x8_t __p0) { 45512 uint16_t __ret; 45513 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45514 __ret = (uint16_t) __builtin_neon_vaddlv_u8(__rev0); 45515 return __ret; 45516 } 45517 #endif 45518 45519 #ifdef __LITTLE_ENDIAN__ 45520 __ai __attribute__((target("neon"))) uint64_t vaddlv_u32(uint32x2_t __p0) { 45521 uint64_t __ret; 45522 __ret = (uint64_t) __builtin_neon_vaddlv_u32(__p0); 45523 return __ret; 45524 } 45525 #else 45526 __ai __attribute__((target("neon"))) uint64_t vaddlv_u32(uint32x2_t __p0) { 45527 uint64_t __ret; 45528 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45529 __ret = (uint64_t) __builtin_neon_vaddlv_u32(__rev0); 45530 return __ret; 45531 } 45532 #endif 45533 45534 #ifdef __LITTLE_ENDIAN__ 45535 __ai __attribute__((target("neon"))) uint32_t vaddlv_u16(uint16x4_t __p0) { 45536 uint32_t __ret; 45537 __ret = (uint32_t) __builtin_neon_vaddlv_u16(__p0); 45538 return __ret; 45539 } 45540 #else 45541 __ai __attribute__((target("neon"))) uint32_t 
vaddlv_u16(uint16x4_t __p0) { 45542 uint32_t __ret; 45543 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45544 __ret = (uint32_t) __builtin_neon_vaddlv_u16(__rev0); 45545 return __ret; 45546 } 45547 #endif 45548 45549 #ifdef __LITTLE_ENDIAN__ 45550 __ai __attribute__((target("neon"))) int16_t vaddlv_s8(int8x8_t __p0) { 45551 int16_t __ret; 45552 __ret = (int16_t) __builtin_neon_vaddlv_s8(__p0); 45553 return __ret; 45554 } 45555 #else 45556 __ai __attribute__((target("neon"))) int16_t vaddlv_s8(int8x8_t __p0) { 45557 int16_t __ret; 45558 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45559 __ret = (int16_t) __builtin_neon_vaddlv_s8(__rev0); 45560 return __ret; 45561 } 45562 #endif 45563 45564 #ifdef __LITTLE_ENDIAN__ 45565 __ai __attribute__((target("neon"))) int64_t vaddlv_s32(int32x2_t __p0) { 45566 int64_t __ret; 45567 __ret = (int64_t) __builtin_neon_vaddlv_s32(__p0); 45568 return __ret; 45569 } 45570 #else 45571 __ai __attribute__((target("neon"))) int64_t vaddlv_s32(int32x2_t __p0) { 45572 int64_t __ret; 45573 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45574 __ret = (int64_t) __builtin_neon_vaddlv_s32(__rev0); 45575 return __ret; 45576 } 45577 #endif 45578 45579 #ifdef __LITTLE_ENDIAN__ 45580 __ai __attribute__((target("neon"))) int32_t vaddlv_s16(int16x4_t __p0) { 45581 int32_t __ret; 45582 __ret = (int32_t) __builtin_neon_vaddlv_s16(__p0); 45583 return __ret; 45584 } 45585 #else 45586 __ai __attribute__((target("neon"))) int32_t vaddlv_s16(int16x4_t __p0) { 45587 int32_t __ret; 45588 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45589 __ret = (int32_t) __builtin_neon_vaddlv_s16(__rev0); 45590 return __ret; 45591 } 45592 #endif 45593 45594 #ifdef __LITTLE_ENDIAN__ 45595 __ai __attribute__((target("neon"))) uint8_t vaddvq_u8(uint8x16_t __p0) { 45596 uint8_t __ret; 45597 __ret = (uint8_t) __builtin_neon_vaddvq_u8(__p0); 45598 return 
__ret; 45599 } 45600 #else 45601 __ai __attribute__((target("neon"))) uint8_t vaddvq_u8(uint8x16_t __p0) { 45602 uint8_t __ret; 45603 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 45604 __ret = (uint8_t) __builtin_neon_vaddvq_u8(__rev0); 45605 return __ret; 45606 } 45607 #endif 45608 45609 #ifdef __LITTLE_ENDIAN__ 45610 __ai __attribute__((target("neon"))) uint32_t vaddvq_u32(uint32x4_t __p0) { 45611 uint32_t __ret; 45612 __ret = (uint32_t) __builtin_neon_vaddvq_u32(__p0); 45613 return __ret; 45614 } 45615 #else 45616 __ai __attribute__((target("neon"))) uint32_t vaddvq_u32(uint32x4_t __p0) { 45617 uint32_t __ret; 45618 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45619 __ret = (uint32_t) __builtin_neon_vaddvq_u32(__rev0); 45620 return __ret; 45621 } 45622 #endif 45623 45624 #ifdef __LITTLE_ENDIAN__ 45625 __ai __attribute__((target("neon"))) uint64_t vaddvq_u64(uint64x2_t __p0) { 45626 uint64_t __ret; 45627 __ret = (uint64_t) __builtin_neon_vaddvq_u64(__p0); 45628 return __ret; 45629 } 45630 #else 45631 __ai __attribute__((target("neon"))) uint64_t vaddvq_u64(uint64x2_t __p0) { 45632 uint64_t __ret; 45633 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45634 __ret = (uint64_t) __builtin_neon_vaddvq_u64(__rev0); 45635 return __ret; 45636 } 45637 #endif 45638 45639 #ifdef __LITTLE_ENDIAN__ 45640 __ai __attribute__((target("neon"))) uint16_t vaddvq_u16(uint16x8_t __p0) { 45641 uint16_t __ret; 45642 __ret = (uint16_t) __builtin_neon_vaddvq_u16(__p0); 45643 return __ret; 45644 } 45645 #else 45646 __ai __attribute__((target("neon"))) uint16_t vaddvq_u16(uint16x8_t __p0) { 45647 uint16_t __ret; 45648 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45649 __ret = (uint16_t) __builtin_neon_vaddvq_u16(__rev0); 45650 return __ret; 45651 } 45652 #endif 45653 45654 #ifdef __LITTLE_ENDIAN__ 45655 __ai 
__attribute__((target("neon"))) int8_t vaddvq_s8(int8x16_t __p0) { 45656 int8_t __ret; 45657 __ret = (int8_t) __builtin_neon_vaddvq_s8(__p0); 45658 return __ret; 45659 } 45660 #else 45661 __ai __attribute__((target("neon"))) int8_t vaddvq_s8(int8x16_t __p0) { 45662 int8_t __ret; 45663 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 45664 __ret = (int8_t) __builtin_neon_vaddvq_s8(__rev0); 45665 return __ret; 45666 } 45667 #endif 45668 45669 #ifdef __LITTLE_ENDIAN__ 45670 __ai __attribute__((target("neon"))) float64_t vaddvq_f64(float64x2_t __p0) { 45671 float64_t __ret; 45672 __ret = (float64_t) __builtin_neon_vaddvq_f64(__p0); 45673 return __ret; 45674 } 45675 #else 45676 __ai __attribute__((target("neon"))) float64_t vaddvq_f64(float64x2_t __p0) { 45677 float64_t __ret; 45678 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45679 __ret = (float64_t) __builtin_neon_vaddvq_f64(__rev0); 45680 return __ret; 45681 } 45682 #endif 45683 45684 #ifdef __LITTLE_ENDIAN__ 45685 __ai __attribute__((target("neon"))) float32_t vaddvq_f32(float32x4_t __p0) { 45686 float32_t __ret; 45687 __ret = (float32_t) __builtin_neon_vaddvq_f32(__p0); 45688 return __ret; 45689 } 45690 #else 45691 __ai __attribute__((target("neon"))) float32_t vaddvq_f32(float32x4_t __p0) { 45692 float32_t __ret; 45693 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45694 __ret = (float32_t) __builtin_neon_vaddvq_f32(__rev0); 45695 return __ret; 45696 } 45697 #endif 45698 45699 #ifdef __LITTLE_ENDIAN__ 45700 __ai __attribute__((target("neon"))) int32_t vaddvq_s32(int32x4_t __p0) { 45701 int32_t __ret; 45702 __ret = (int32_t) __builtin_neon_vaddvq_s32(__p0); 45703 return __ret; 45704 } 45705 #else 45706 __ai __attribute__((target("neon"))) int32_t vaddvq_s32(int32x4_t __p0) { 45707 int32_t __ret; 45708 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45709 __ret = 
(int32_t) __builtin_neon_vaddvq_s32(__rev0); 45710 return __ret; 45711 } 45712 #endif 45713 45714 #ifdef __LITTLE_ENDIAN__ 45715 __ai __attribute__((target("neon"))) int64_t vaddvq_s64(int64x2_t __p0) { 45716 int64_t __ret; 45717 __ret = (int64_t) __builtin_neon_vaddvq_s64(__p0); 45718 return __ret; 45719 } 45720 #else 45721 __ai __attribute__((target("neon"))) int64_t vaddvq_s64(int64x2_t __p0) { 45722 int64_t __ret; 45723 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45724 __ret = (int64_t) __builtin_neon_vaddvq_s64(__rev0); 45725 return __ret; 45726 } 45727 #endif 45728 45729 #ifdef __LITTLE_ENDIAN__ 45730 __ai __attribute__((target("neon"))) int16_t vaddvq_s16(int16x8_t __p0) { 45731 int16_t __ret; 45732 __ret = (int16_t) __builtin_neon_vaddvq_s16(__p0); 45733 return __ret; 45734 } 45735 #else 45736 __ai __attribute__((target("neon"))) int16_t vaddvq_s16(int16x8_t __p0) { 45737 int16_t __ret; 45738 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45739 __ret = (int16_t) __builtin_neon_vaddvq_s16(__rev0); 45740 return __ret; 45741 } 45742 #endif 45743 45744 #ifdef __LITTLE_ENDIAN__ 45745 __ai __attribute__((target("neon"))) uint8_t vaddv_u8(uint8x8_t __p0) { 45746 uint8_t __ret; 45747 __ret = (uint8_t) __builtin_neon_vaddv_u8(__p0); 45748 return __ret; 45749 } 45750 #else 45751 __ai __attribute__((target("neon"))) uint8_t vaddv_u8(uint8x8_t __p0) { 45752 uint8_t __ret; 45753 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45754 __ret = (uint8_t) __builtin_neon_vaddv_u8(__rev0); 45755 return __ret; 45756 } 45757 #endif 45758 45759 #ifdef __LITTLE_ENDIAN__ 45760 __ai __attribute__((target("neon"))) uint32_t vaddv_u32(uint32x2_t __p0) { 45761 uint32_t __ret; 45762 __ret = (uint32_t) __builtin_neon_vaddv_u32(__p0); 45763 return __ret; 45764 } 45765 #else 45766 __ai __attribute__((target("neon"))) uint32_t vaddv_u32(uint32x2_t __p0) { 45767 uint32_t __ret; 45768 
uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45769 __ret = (uint32_t) __builtin_neon_vaddv_u32(__rev0); 45770 return __ret; 45771 } 45772 #endif 45773 45774 #ifdef __LITTLE_ENDIAN__ 45775 __ai __attribute__((target("neon"))) uint16_t vaddv_u16(uint16x4_t __p0) { 45776 uint16_t __ret; 45777 __ret = (uint16_t) __builtin_neon_vaddv_u16(__p0); 45778 return __ret; 45779 } 45780 #else 45781 __ai __attribute__((target("neon"))) uint16_t vaddv_u16(uint16x4_t __p0) { 45782 uint16_t __ret; 45783 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45784 __ret = (uint16_t) __builtin_neon_vaddv_u16(__rev0); 45785 return __ret; 45786 } 45787 #endif 45788 45789 #ifdef __LITTLE_ENDIAN__ 45790 __ai __attribute__((target("neon"))) int8_t vaddv_s8(int8x8_t __p0) { 45791 int8_t __ret; 45792 __ret = (int8_t) __builtin_neon_vaddv_s8(__p0); 45793 return __ret; 45794 } 45795 #else 45796 __ai __attribute__((target("neon"))) int8_t vaddv_s8(int8x8_t __p0) { 45797 int8_t __ret; 45798 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 45799 __ret = (int8_t) __builtin_neon_vaddv_s8(__rev0); 45800 return __ret; 45801 } 45802 #endif 45803 45804 #ifdef __LITTLE_ENDIAN__ 45805 __ai __attribute__((target("neon"))) float32_t vaddv_f32(float32x2_t __p0) { 45806 float32_t __ret; 45807 __ret = (float32_t) __builtin_neon_vaddv_f32(__p0); 45808 return __ret; 45809 } 45810 #else 45811 __ai __attribute__((target("neon"))) float32_t vaddv_f32(float32x2_t __p0) { 45812 float32_t __ret; 45813 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45814 __ret = (float32_t) __builtin_neon_vaddv_f32(__rev0); 45815 return __ret; 45816 } 45817 #endif 45818 45819 #ifdef __LITTLE_ENDIAN__ 45820 __ai __attribute__((target("neon"))) int32_t vaddv_s32(int32x2_t __p0) { 45821 int32_t __ret; 45822 __ret = (int32_t) __builtin_neon_vaddv_s32(__p0); 45823 return __ret; 45824 } 45825 #else 45826 __ai 
__attribute__((target("neon"))) int32_t vaddv_s32(int32x2_t __p0) { 45827 int32_t __ret; 45828 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45829 __ret = (int32_t) __builtin_neon_vaddv_s32(__rev0); 45830 return __ret; 45831 } 45832 #endif 45833 45834 #ifdef __LITTLE_ENDIAN__ 45835 __ai __attribute__((target("neon"))) int16_t vaddv_s16(int16x4_t __p0) { 45836 int16_t __ret; 45837 __ret = (int16_t) __builtin_neon_vaddv_s16(__p0); 45838 return __ret; 45839 } 45840 #else 45841 __ai __attribute__((target("neon"))) int16_t vaddv_s16(int16x4_t __p0) { 45842 int16_t __ret; 45843 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 45844 __ret = (int16_t) __builtin_neon_vaddv_s16(__rev0); 45845 return __ret; 45846 } 45847 #endif 45848 45849 __ai __attribute__((target("neon"))) poly64x1_t vbsl_p64(uint64x1_t __p0, poly64x1_t __p1, poly64x1_t __p2) { 45850 poly64x1_t __ret; 45851 __ret = (poly64x1_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 6); 45852 return __ret; 45853 } 45854 #ifdef __LITTLE_ENDIAN__ 45855 __ai __attribute__((target("neon"))) poly64x2_t vbslq_p64(uint64x2_t __p0, poly64x2_t __p1, poly64x2_t __p2) { 45856 poly64x2_t __ret; 45857 __ret = (poly64x2_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 38); 45858 return __ret; 45859 } 45860 #else 45861 __ai __attribute__((target("neon"))) poly64x2_t vbslq_p64(uint64x2_t __p0, poly64x2_t __p1, poly64x2_t __p2) { 45862 poly64x2_t __ret; 45863 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45864 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45865 poly64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 45866 __ret = (poly64x2_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 38); 45867 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45868 return __ret; 45869 } 45870 #endif 45871 45872 #ifdef __LITTLE_ENDIAN__ 45873 
__ai __attribute__((target("neon"))) float64x2_t vbslq_f64(uint64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 45874 float64x2_t __ret; 45875 __ret = (float64x2_t) __builtin_neon_vbslq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42); 45876 return __ret; 45877 } 45878 #else 45879 __ai __attribute__((target("neon"))) float64x2_t vbslq_f64(uint64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 45880 float64x2_t __ret; 45881 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45882 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45883 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 45884 __ret = (float64x2_t) __builtin_neon_vbslq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42); 45885 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45886 return __ret; 45887 } 45888 #endif 45889 45890 __ai __attribute__((target("neon"))) float64x1_t vbsl_f64(uint64x1_t __p0, float64x1_t __p1, float64x1_t __p2) { 45891 float64x1_t __ret; 45892 __ret = (float64x1_t) __builtin_neon_vbsl_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 10); 45893 return __ret; 45894 } 45895 #ifdef __LITTLE_ENDIAN__ 45896 __ai __attribute__((target("neon"))) uint64x2_t vcageq_f64(float64x2_t __p0, float64x2_t __p1) { 45897 uint64x2_t __ret; 45898 __ret = (uint64x2_t) __builtin_neon_vcageq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 45899 return __ret; 45900 } 45901 #else 45902 __ai __attribute__((target("neon"))) uint64x2_t vcageq_f64(float64x2_t __p0, float64x2_t __p1) { 45903 uint64x2_t __ret; 45904 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45905 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45906 __ret = (uint64x2_t) __builtin_neon_vcageq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 45907 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45908 return __ret; 45909 } 45910 #endif 45911 45912 __ai __attribute__((target("neon"))) uint64x1_t 
vcage_f64(float64x1_t __p0, float64x1_t __p1) { 45913 uint64x1_t __ret; 45914 __ret = (uint64x1_t) __builtin_neon_vcage_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 45915 return __ret; 45916 } 45917 __ai __attribute__((target("neon"))) uint64_t vcaged_f64(float64_t __p0, float64_t __p1) { 45918 uint64_t __ret; 45919 __ret = (uint64_t) __builtin_neon_vcaged_f64(__p0, __p1); 45920 return __ret; 45921 } 45922 __ai __attribute__((target("neon"))) uint32_t vcages_f32(float32_t __p0, float32_t __p1) { 45923 uint32_t __ret; 45924 __ret = (uint32_t) __builtin_neon_vcages_f32(__p0, __p1); 45925 return __ret; 45926 } 45927 #ifdef __LITTLE_ENDIAN__ 45928 __ai __attribute__((target("neon"))) uint64x2_t vcagtq_f64(float64x2_t __p0, float64x2_t __p1) { 45929 uint64x2_t __ret; 45930 __ret = (uint64x2_t) __builtin_neon_vcagtq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 45931 return __ret; 45932 } 45933 #else 45934 __ai __attribute__((target("neon"))) uint64x2_t vcagtq_f64(float64x2_t __p0, float64x2_t __p1) { 45935 uint64x2_t __ret; 45936 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45937 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45938 __ret = (uint64x2_t) __builtin_neon_vcagtq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 45939 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45940 return __ret; 45941 } 45942 #endif 45943 45944 __ai __attribute__((target("neon"))) uint64x1_t vcagt_f64(float64x1_t __p0, float64x1_t __p1) { 45945 uint64x1_t __ret; 45946 __ret = (uint64x1_t) __builtin_neon_vcagt_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 45947 return __ret; 45948 } 45949 __ai __attribute__((target("neon"))) uint64_t vcagtd_f64(float64_t __p0, float64_t __p1) { 45950 uint64_t __ret; 45951 __ret = (uint64_t) __builtin_neon_vcagtd_f64(__p0, __p1); 45952 return __ret; 45953 } 45954 __ai __attribute__((target("neon"))) uint32_t vcagts_f32(float32_t __p0, float32_t __p1) { 45955 uint32_t __ret; 45956 __ret = (uint32_t) 
__builtin_neon_vcagts_f32(__p0, __p1); 45957 return __ret; 45958 } 45959 #ifdef __LITTLE_ENDIAN__ 45960 __ai __attribute__((target("neon"))) uint64x2_t vcaleq_f64(float64x2_t __p0, float64x2_t __p1) { 45961 uint64x2_t __ret; 45962 __ret = (uint64x2_t) __builtin_neon_vcaleq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 45963 return __ret; 45964 } 45965 #else 45966 __ai __attribute__((target("neon"))) uint64x2_t vcaleq_f64(float64x2_t __p0, float64x2_t __p1) { 45967 uint64x2_t __ret; 45968 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 45969 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 45970 __ret = (uint64x2_t) __builtin_neon_vcaleq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 45971 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 45972 return __ret; 45973 } 45974 #endif 45975 45976 __ai __attribute__((target("neon"))) uint64x1_t vcale_f64(float64x1_t __p0, float64x1_t __p1) { 45977 uint64x1_t __ret; 45978 __ret = (uint64x1_t) __builtin_neon_vcale_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 45979 return __ret; 45980 } 45981 __ai __attribute__((target("neon"))) uint64_t vcaled_f64(float64_t __p0, float64_t __p1) { 45982 uint64_t __ret; 45983 __ret = (uint64_t) __builtin_neon_vcaled_f64(__p0, __p1); 45984 return __ret; 45985 } 45986 __ai __attribute__((target("neon"))) uint32_t vcales_f32(float32_t __p0, float32_t __p1) { 45987 uint32_t __ret; 45988 __ret = (uint32_t) __builtin_neon_vcales_f32(__p0, __p1); 45989 return __ret; 45990 } 45991 #ifdef __LITTLE_ENDIAN__ 45992 __ai __attribute__((target("neon"))) uint64x2_t vcaltq_f64(float64x2_t __p0, float64x2_t __p1) { 45993 uint64x2_t __ret; 45994 __ret = (uint64x2_t) __builtin_neon_vcaltq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 45995 return __ret; 45996 } 45997 #else 45998 __ai __attribute__((target("neon"))) uint64x2_t vcaltq_f64(float64x2_t __p0, float64x2_t __p1) { 45999 uint64x2_t __ret; 46000 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46001 
float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46002 __ret = (uint64x2_t) __builtin_neon_vcaltq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 46003 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46004 return __ret; 46005 } 46006 #endif 46007 46008 __ai __attribute__((target("neon"))) uint64x1_t vcalt_f64(float64x1_t __p0, float64x1_t __p1) { 46009 uint64x1_t __ret; 46010 __ret = (uint64x1_t) __builtin_neon_vcalt_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 46011 return __ret; 46012 } 46013 __ai __attribute__((target("neon"))) uint64_t vcaltd_f64(float64_t __p0, float64_t __p1) { 46014 uint64_t __ret; 46015 __ret = (uint64_t) __builtin_neon_vcaltd_f64(__p0, __p1); 46016 return __ret; 46017 } 46018 __ai __attribute__((target("neon"))) uint32_t vcalts_f32(float32_t __p0, float32_t __p1) { 46019 uint32_t __ret; 46020 __ret = (uint32_t) __builtin_neon_vcalts_f32(__p0, __p1); 46021 return __ret; 46022 } 46023 __ai __attribute__((target("neon"))) uint64x1_t vceq_p64(poly64x1_t __p0, poly64x1_t __p1) { 46024 uint64x1_t __ret; 46025 __ret = (uint64x1_t)(__p0 == __p1); 46026 return __ret; 46027 } 46028 #ifdef __LITTLE_ENDIAN__ 46029 __ai __attribute__((target("neon"))) uint64x2_t vceqq_p64(poly64x2_t __p0, poly64x2_t __p1) { 46030 uint64x2_t __ret; 46031 __ret = (uint64x2_t)(__p0 == __p1); 46032 return __ret; 46033 } 46034 #else 46035 __ai __attribute__((target("neon"))) uint64x2_t vceqq_p64(poly64x2_t __p0, poly64x2_t __p1) { 46036 uint64x2_t __ret; 46037 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46038 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46039 __ret = (uint64x2_t)(__rev0 == __rev1); 46040 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46041 return __ret; 46042 } 46043 #endif 46044 46045 #ifdef __LITTLE_ENDIAN__ 46046 __ai __attribute__((target("neon"))) uint64x2_t vceqq_u64(uint64x2_t __p0, uint64x2_t __p1) { 46047 uint64x2_t __ret; 46048 __ret = (uint64x2_t)(__p0 == __p1); 46049 
return __ret; 46050 } 46051 #else 46052 __ai __attribute__((target("neon"))) uint64x2_t vceqq_u64(uint64x2_t __p0, uint64x2_t __p1) { 46053 uint64x2_t __ret; 46054 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46055 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46056 __ret = (uint64x2_t)(__rev0 == __rev1); 46057 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46058 return __ret; 46059 } 46060 #endif 46061 46062 #ifdef __LITTLE_ENDIAN__ 46063 __ai __attribute__((target("neon"))) uint64x2_t vceqq_f64(float64x2_t __p0, float64x2_t __p1) { 46064 uint64x2_t __ret; 46065 __ret = (uint64x2_t)(__p0 == __p1); 46066 return __ret; 46067 } 46068 #else 46069 __ai __attribute__((target("neon"))) uint64x2_t vceqq_f64(float64x2_t __p0, float64x2_t __p1) { 46070 uint64x2_t __ret; 46071 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46072 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46073 __ret = (uint64x2_t)(__rev0 == __rev1); 46074 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46075 return __ret; 46076 } 46077 #endif 46078 46079 #ifdef __LITTLE_ENDIAN__ 46080 __ai __attribute__((target("neon"))) uint64x2_t vceqq_s64(int64x2_t __p0, int64x2_t __p1) { 46081 uint64x2_t __ret; 46082 __ret = (uint64x2_t)(__p0 == __p1); 46083 return __ret; 46084 } 46085 #else 46086 __ai __attribute__((target("neon"))) uint64x2_t vceqq_s64(int64x2_t __p0, int64x2_t __p1) { 46087 uint64x2_t __ret; 46088 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46089 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46090 __ret = (uint64x2_t)(__rev0 == __rev1); 46091 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46092 return __ret; 46093 } 46094 #endif 46095 46096 __ai __attribute__((target("neon"))) uint64x1_t vceq_u64(uint64x1_t __p0, uint64x1_t __p1) { 46097 uint64x1_t __ret; 46098 __ret = (uint64x1_t)(__p0 == __p1); 46099 return __ret; 46100 } 46101 
__ai __attribute__((target("neon"))) uint64x1_t vceq_f64(float64x1_t __p0, float64x1_t __p1) { 46102 uint64x1_t __ret; 46103 __ret = (uint64x1_t)(__p0 == __p1); 46104 return __ret; 46105 } 46106 __ai __attribute__((target("neon"))) uint64x1_t vceq_s64(int64x1_t __p0, int64x1_t __p1) { 46107 uint64x1_t __ret; 46108 __ret = (uint64x1_t)(__p0 == __p1); 46109 return __ret; 46110 } 46111 __ai __attribute__((target("neon"))) uint64_t vceqd_u64(uint64_t __p0, uint64_t __p1) { 46112 uint64_t __ret; 46113 __ret = (uint64_t) __builtin_neon_vceqd_u64(__p0, __p1); 46114 return __ret; 46115 } 46116 __ai __attribute__((target("neon"))) uint64_t vceqd_s64(int64_t __p0, int64_t __p1) { 46117 uint64_t __ret; 46118 __ret = (uint64_t) __builtin_neon_vceqd_s64(__p0, __p1); 46119 return __ret; 46120 } 46121 __ai __attribute__((target("neon"))) uint64_t vceqd_f64(float64_t __p0, float64_t __p1) { 46122 uint64_t __ret; 46123 __ret = (uint64_t) __builtin_neon_vceqd_f64(__p0, __p1); 46124 return __ret; 46125 } 46126 __ai __attribute__((target("neon"))) uint32_t vceqs_f32(float32_t __p0, float32_t __p1) { 46127 uint32_t __ret; 46128 __ret = (uint32_t) __builtin_neon_vceqs_f32(__p0, __p1); 46129 return __ret; 46130 } 46131 #ifdef __LITTLE_ENDIAN__ 46132 __ai __attribute__((target("neon"))) uint8x8_t vceqz_p8(poly8x8_t __p0) { 46133 uint8x8_t __ret; 46134 __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 16); 46135 return __ret; 46136 } 46137 #else 46138 __ai __attribute__((target("neon"))) uint8x8_t vceqz_p8(poly8x8_t __p0) { 46139 uint8x8_t __ret; 46140 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46141 __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 16); 46142 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 46143 return __ret; 46144 } 46145 #endif 46146 46147 __ai __attribute__((target("neon"))) uint64x1_t vceqz_p64(poly64x1_t __p0) { 46148 uint64x1_t __ret; 46149 __ret = (uint64x1_t) 
__builtin_neon_vceqz_v((int8x8_t)__p0, 19); 46150 return __ret; 46151 } 46152 #ifdef __LITTLE_ENDIAN__ 46153 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_p8(poly8x16_t __p0) { 46154 uint8x16_t __ret; 46155 __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 48); 46156 return __ret; 46157 } 46158 #else 46159 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_p8(poly8x16_t __p0) { 46160 uint8x16_t __ret; 46161 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46162 __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 48); 46163 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46164 return __ret; 46165 } 46166 #endif 46167 46168 #ifdef __LITTLE_ENDIAN__ 46169 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_p64(poly64x2_t __p0) { 46170 uint64x2_t __ret; 46171 __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 51); 46172 return __ret; 46173 } 46174 #else 46175 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_p64(poly64x2_t __p0) { 46176 uint64x2_t __ret; 46177 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46178 __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 51); 46179 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46180 return __ret; 46181 } 46182 #endif 46183 46184 #ifdef __LITTLE_ENDIAN__ 46185 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_u8(uint8x16_t __p0) { 46186 uint8x16_t __ret; 46187 __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 48); 46188 return __ret; 46189 } 46190 #else 46191 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_u8(uint8x16_t __p0) { 46192 uint8x16_t __ret; 46193 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46194 __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 48); 46195 __ret = 
__builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46196 return __ret; 46197 } 46198 #endif 46199 46200 #ifdef __LITTLE_ENDIAN__ 46201 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_u32(uint32x4_t __p0) { 46202 uint32x4_t __ret; 46203 __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 50); 46204 return __ret; 46205 } 46206 #else 46207 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_u32(uint32x4_t __p0) { 46208 uint32x4_t __ret; 46209 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46210 __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 50); 46211 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46212 return __ret; 46213 } 46214 #endif 46215 46216 #ifdef __LITTLE_ENDIAN__ 46217 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_u64(uint64x2_t __p0) { 46218 uint64x2_t __ret; 46219 __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 51); 46220 return __ret; 46221 } 46222 #else 46223 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_u64(uint64x2_t __p0) { 46224 uint64x2_t __ret; 46225 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46226 __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 51); 46227 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46228 return __ret; 46229 } 46230 #endif 46231 46232 #ifdef __LITTLE_ENDIAN__ 46233 __ai __attribute__((target("neon"))) uint16x8_t vceqzq_u16(uint16x8_t __p0) { 46234 uint16x8_t __ret; 46235 __ret = (uint16x8_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 49); 46236 return __ret; 46237 } 46238 #else 46239 __ai __attribute__((target("neon"))) uint16x8_t vceqzq_u16(uint16x8_t __p0) { 46240 uint16x8_t __ret; 46241 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46242 __ret = (uint16x8_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 49); 46243 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 
46244 return __ret; 46245 } 46246 #endif 46247 46248 #ifdef __LITTLE_ENDIAN__ 46249 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_s8(int8x16_t __p0) { 46250 uint8x16_t __ret; 46251 __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 48); 46252 return __ret; 46253 } 46254 #else 46255 __ai __attribute__((target("neon"))) uint8x16_t vceqzq_s8(int8x16_t __p0) { 46256 uint8x16_t __ret; 46257 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46258 __ret = (uint8x16_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 48); 46259 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46260 return __ret; 46261 } 46262 #endif 46263 46264 #ifdef __LITTLE_ENDIAN__ 46265 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_f64(float64x2_t __p0) { 46266 uint64x2_t __ret; 46267 __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 51); 46268 return __ret; 46269 } 46270 #else 46271 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_f64(float64x2_t __p0) { 46272 uint64x2_t __ret; 46273 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46274 __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 51); 46275 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46276 return __ret; 46277 } 46278 #endif 46279 46280 #ifdef __LITTLE_ENDIAN__ 46281 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_f32(float32x4_t __p0) { 46282 uint32x4_t __ret; 46283 __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 50); 46284 return __ret; 46285 } 46286 #else 46287 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_f32(float32x4_t __p0) { 46288 uint32x4_t __ret; 46289 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46290 __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 50); 46291 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46292 return __ret; 46293 } 46294 
#endif 46295 46296 #ifdef __LITTLE_ENDIAN__ 46297 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_s32(int32x4_t __p0) { 46298 uint32x4_t __ret; 46299 __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 50); 46300 return __ret; 46301 } 46302 #else 46303 __ai __attribute__((target("neon"))) uint32x4_t vceqzq_s32(int32x4_t __p0) { 46304 uint32x4_t __ret; 46305 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46306 __ret = (uint32x4_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 50); 46307 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46308 return __ret; 46309 } 46310 #endif 46311 46312 #ifdef __LITTLE_ENDIAN__ 46313 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_s64(int64x2_t __p0) { 46314 uint64x2_t __ret; 46315 __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 51); 46316 return __ret; 46317 } 46318 #else 46319 __ai __attribute__((target("neon"))) uint64x2_t vceqzq_s64(int64x2_t __p0) { 46320 uint64x2_t __ret; 46321 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46322 __ret = (uint64x2_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 51); 46323 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46324 return __ret; 46325 } 46326 #endif 46327 46328 #ifdef __LITTLE_ENDIAN__ 46329 __ai __attribute__((target("neon"))) uint16x8_t vceqzq_s16(int16x8_t __p0) { 46330 uint16x8_t __ret; 46331 __ret = (uint16x8_t) __builtin_neon_vceqzq_v((int8x16_t)__p0, 49); 46332 return __ret; 46333 } 46334 #else 46335 __ai __attribute__((target("neon"))) uint16x8_t vceqzq_s16(int16x8_t __p0) { 46336 uint16x8_t __ret; 46337 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46338 __ret = (uint16x8_t) __builtin_neon_vceqzq_v((int8x16_t)__rev0, 49); 46339 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 46340 return __ret; 46341 } 46342 #endif 46343 46344 #ifdef __LITTLE_ENDIAN__ 46345 __ai __attribute__((target("neon"))) uint8x8_t 
vceqz_u8(uint8x8_t __p0) { 46346 uint8x8_t __ret; 46347 __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 16); 46348 return __ret; 46349 } 46350 #else 46351 __ai __attribute__((target("neon"))) uint8x8_t vceqz_u8(uint8x8_t __p0) { 46352 uint8x8_t __ret; 46353 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46354 __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 16); 46355 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 46356 return __ret; 46357 } 46358 #endif 46359 46360 #ifdef __LITTLE_ENDIAN__ 46361 __ai __attribute__((target("neon"))) uint32x2_t vceqz_u32(uint32x2_t __p0) { 46362 uint32x2_t __ret; 46363 __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 18); 46364 return __ret; 46365 } 46366 #else 46367 __ai __attribute__((target("neon"))) uint32x2_t vceqz_u32(uint32x2_t __p0) { 46368 uint32x2_t __ret; 46369 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46370 __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 18); 46371 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46372 return __ret; 46373 } 46374 #endif 46375 46376 __ai __attribute__((target("neon"))) uint64x1_t vceqz_u64(uint64x1_t __p0) { 46377 uint64x1_t __ret; 46378 __ret = (uint64x1_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 19); 46379 return __ret; 46380 } 46381 #ifdef __LITTLE_ENDIAN__ 46382 __ai __attribute__((target("neon"))) uint16x4_t vceqz_u16(uint16x4_t __p0) { 46383 uint16x4_t __ret; 46384 __ret = (uint16x4_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 17); 46385 return __ret; 46386 } 46387 #else 46388 __ai __attribute__((target("neon"))) uint16x4_t vceqz_u16(uint16x4_t __p0) { 46389 uint16x4_t __ret; 46390 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46391 __ret = (uint16x4_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 17); 46392 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46393 return __ret; 46394 } 46395 #endif 46396 
46397 #ifdef __LITTLE_ENDIAN__ 46398 __ai __attribute__((target("neon"))) uint8x8_t vceqz_s8(int8x8_t __p0) { 46399 uint8x8_t __ret; 46400 __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 16); 46401 return __ret; 46402 } 46403 #else 46404 __ai __attribute__((target("neon"))) uint8x8_t vceqz_s8(int8x8_t __p0) { 46405 uint8x8_t __ret; 46406 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46407 __ret = (uint8x8_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 16); 46408 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 46409 return __ret; 46410 } 46411 #endif 46412 46413 __ai __attribute__((target("neon"))) uint64x1_t vceqz_f64(float64x1_t __p0) { 46414 uint64x1_t __ret; 46415 __ret = (uint64x1_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 19); 46416 return __ret; 46417 } 46418 #ifdef __LITTLE_ENDIAN__ 46419 __ai __attribute__((target("neon"))) uint32x2_t vceqz_f32(float32x2_t __p0) { 46420 uint32x2_t __ret; 46421 __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 18); 46422 return __ret; 46423 } 46424 #else 46425 __ai __attribute__((target("neon"))) uint32x2_t vceqz_f32(float32x2_t __p0) { 46426 uint32x2_t __ret; 46427 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46428 __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 18); 46429 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46430 return __ret; 46431 } 46432 #endif 46433 46434 #ifdef __LITTLE_ENDIAN__ 46435 __ai __attribute__((target("neon"))) uint32x2_t vceqz_s32(int32x2_t __p0) { 46436 uint32x2_t __ret; 46437 __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 18); 46438 return __ret; 46439 } 46440 #else 46441 __ai __attribute__((target("neon"))) uint32x2_t vceqz_s32(int32x2_t __p0) { 46442 uint32x2_t __ret; 46443 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46444 __ret = (uint32x2_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 18); 46445 __ret = 
__builtin_shufflevector(__ret, __ret, 1, 0); 46446 return __ret; 46447 } 46448 #endif 46449 46450 __ai __attribute__((target("neon"))) uint64x1_t vceqz_s64(int64x1_t __p0) { 46451 uint64x1_t __ret; 46452 __ret = (uint64x1_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 19); 46453 return __ret; 46454 } 46455 #ifdef __LITTLE_ENDIAN__ 46456 __ai __attribute__((target("neon"))) uint16x4_t vceqz_s16(int16x4_t __p0) { 46457 uint16x4_t __ret; 46458 __ret = (uint16x4_t) __builtin_neon_vceqz_v((int8x8_t)__p0, 17); 46459 return __ret; 46460 } 46461 #else 46462 __ai __attribute__((target("neon"))) uint16x4_t vceqz_s16(int16x4_t __p0) { 46463 uint16x4_t __ret; 46464 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46465 __ret = (uint16x4_t) __builtin_neon_vceqz_v((int8x8_t)__rev0, 17); 46466 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46467 return __ret; 46468 } 46469 #endif 46470 46471 __ai __attribute__((target("neon"))) uint64_t vceqzd_u64(uint64_t __p0) { 46472 uint64_t __ret; 46473 __ret = (uint64_t) __builtin_neon_vceqzd_u64(__p0); 46474 return __ret; 46475 } 46476 __ai __attribute__((target("neon"))) uint64_t vceqzd_s64(int64_t __p0) { 46477 uint64_t __ret; 46478 __ret = (uint64_t) __builtin_neon_vceqzd_s64(__p0); 46479 return __ret; 46480 } 46481 __ai __attribute__((target("neon"))) uint64_t vceqzd_f64(float64_t __p0) { 46482 uint64_t __ret; 46483 __ret = (uint64_t) __builtin_neon_vceqzd_f64(__p0); 46484 return __ret; 46485 } 46486 __ai __attribute__((target("neon"))) uint32_t vceqzs_f32(float32_t __p0) { 46487 uint32_t __ret; 46488 __ret = (uint32_t) __builtin_neon_vceqzs_f32(__p0); 46489 return __ret; 46490 } 46491 #ifdef __LITTLE_ENDIAN__ 46492 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_u64(uint64x2_t __p0, uint64x2_t __p1) { 46493 uint64x2_t __ret; 46494 __ret = (uint64x2_t)(__p0 >= __p1); 46495 return __ret; 46496 } 46497 #else 46498 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_u64(uint64x2_t __p0, uint64x2_t 
__p1) { 46499 uint64x2_t __ret; 46500 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46501 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46502 __ret = (uint64x2_t)(__rev0 >= __rev1); 46503 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46504 return __ret; 46505 } 46506 #endif 46507 46508 #ifdef __LITTLE_ENDIAN__ 46509 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_f64(float64x2_t __p0, float64x2_t __p1) { 46510 uint64x2_t __ret; 46511 __ret = (uint64x2_t)(__p0 >= __p1); 46512 return __ret; 46513 } 46514 #else 46515 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_f64(float64x2_t __p0, float64x2_t __p1) { 46516 uint64x2_t __ret; 46517 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46518 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46519 __ret = (uint64x2_t)(__rev0 >= __rev1); 46520 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46521 return __ret; 46522 } 46523 #endif 46524 46525 #ifdef __LITTLE_ENDIAN__ 46526 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_s64(int64x2_t __p0, int64x2_t __p1) { 46527 uint64x2_t __ret; 46528 __ret = (uint64x2_t)(__p0 >= __p1); 46529 return __ret; 46530 } 46531 #else 46532 __ai __attribute__((target("neon"))) uint64x2_t vcgeq_s64(int64x2_t __p0, int64x2_t __p1) { 46533 uint64x2_t __ret; 46534 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46535 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46536 __ret = (uint64x2_t)(__rev0 >= __rev1); 46537 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46538 return __ret; 46539 } 46540 #endif 46541 46542 __ai __attribute__((target("neon"))) uint64x1_t vcge_u64(uint64x1_t __p0, uint64x1_t __p1) { 46543 uint64x1_t __ret; 46544 __ret = (uint64x1_t)(__p0 >= __p1); 46545 return __ret; 46546 } 46547 __ai __attribute__((target("neon"))) uint64x1_t vcge_f64(float64x1_t __p0, float64x1_t __p1) { 46548 uint64x1_t __ret; 46549 
__ret = (uint64x1_t)(__p0 >= __p1); 46550 return __ret; 46551 } 46552 __ai __attribute__((target("neon"))) uint64x1_t vcge_s64(int64x1_t __p0, int64x1_t __p1) { 46553 uint64x1_t __ret; 46554 __ret = (uint64x1_t)(__p0 >= __p1); 46555 return __ret; 46556 } 46557 __ai __attribute__((target("neon"))) uint64_t vcged_s64(int64_t __p0, int64_t __p1) { 46558 uint64_t __ret; 46559 __ret = (uint64_t) __builtin_neon_vcged_s64(__p0, __p1); 46560 return __ret; 46561 } 46562 __ai __attribute__((target("neon"))) uint64_t vcged_u64(uint64_t __p0, uint64_t __p1) { 46563 uint64_t __ret; 46564 __ret = (uint64_t) __builtin_neon_vcged_u64(__p0, __p1); 46565 return __ret; 46566 } 46567 __ai __attribute__((target("neon"))) uint64_t vcged_f64(float64_t __p0, float64_t __p1) { 46568 uint64_t __ret; 46569 __ret = (uint64_t) __builtin_neon_vcged_f64(__p0, __p1); 46570 return __ret; 46571 } 46572 __ai __attribute__((target("neon"))) uint32_t vcges_f32(float32_t __p0, float32_t __p1) { 46573 uint32_t __ret; 46574 __ret = (uint32_t) __builtin_neon_vcges_f32(__p0, __p1); 46575 return __ret; 46576 } 46577 #ifdef __LITTLE_ENDIAN__ 46578 __ai __attribute__((target("neon"))) uint8x16_t vcgezq_s8(int8x16_t __p0) { 46579 uint8x16_t __ret; 46580 __ret = (uint8x16_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 48); 46581 return __ret; 46582 } 46583 #else 46584 __ai __attribute__((target("neon"))) uint8x16_t vcgezq_s8(int8x16_t __p0) { 46585 uint8x16_t __ret; 46586 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46587 __ret = (uint8x16_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 48); 46588 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46589 return __ret; 46590 } 46591 #endif 46592 46593 #ifdef __LITTLE_ENDIAN__ 46594 __ai __attribute__((target("neon"))) uint64x2_t vcgezq_f64(float64x2_t __p0) { 46595 uint64x2_t __ret; 46596 __ret = (uint64x2_t) 
__builtin_neon_vcgezq_v((int8x16_t)__p0, 51); 46597 return __ret; 46598 } 46599 #else 46600 __ai __attribute__((target("neon"))) uint64x2_t vcgezq_f64(float64x2_t __p0) { 46601 uint64x2_t __ret; 46602 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46603 __ret = (uint64x2_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 51); 46604 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46605 return __ret; 46606 } 46607 #endif 46608 46609 #ifdef __LITTLE_ENDIAN__ 46610 __ai __attribute__((target("neon"))) uint32x4_t vcgezq_f32(float32x4_t __p0) { 46611 uint32x4_t __ret; 46612 __ret = (uint32x4_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 50); 46613 return __ret; 46614 } 46615 #else 46616 __ai __attribute__((target("neon"))) uint32x4_t vcgezq_f32(float32x4_t __p0) { 46617 uint32x4_t __ret; 46618 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46619 __ret = (uint32x4_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 50); 46620 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46621 return __ret; 46622 } 46623 #endif 46624 46625 #ifdef __LITTLE_ENDIAN__ 46626 __ai __attribute__((target("neon"))) uint32x4_t vcgezq_s32(int32x4_t __p0) { 46627 uint32x4_t __ret; 46628 __ret = (uint32x4_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 50); 46629 return __ret; 46630 } 46631 #else 46632 __ai __attribute__((target("neon"))) uint32x4_t vcgezq_s32(int32x4_t __p0) { 46633 uint32x4_t __ret; 46634 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46635 __ret = (uint32x4_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 50); 46636 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46637 return __ret; 46638 } 46639 #endif 46640 46641 #ifdef __LITTLE_ENDIAN__ 46642 __ai __attribute__((target("neon"))) uint64x2_t vcgezq_s64(int64x2_t __p0) { 46643 uint64x2_t __ret; 46644 __ret = (uint64x2_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 51); 46645 return __ret; 46646 } 46647 #else 46648 __ai 
__attribute__((target("neon"))) uint64x2_t vcgezq_s64(int64x2_t __p0) { 46649 uint64x2_t __ret; 46650 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46651 __ret = (uint64x2_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 51); 46652 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46653 return __ret; 46654 } 46655 #endif 46656 46657 #ifdef __LITTLE_ENDIAN__ 46658 __ai __attribute__((target("neon"))) uint16x8_t vcgezq_s16(int16x8_t __p0) { 46659 uint16x8_t __ret; 46660 __ret = (uint16x8_t) __builtin_neon_vcgezq_v((int8x16_t)__p0, 49); 46661 return __ret; 46662 } 46663 #else 46664 __ai __attribute__((target("neon"))) uint16x8_t vcgezq_s16(int16x8_t __p0) { 46665 uint16x8_t __ret; 46666 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46667 __ret = (uint16x8_t) __builtin_neon_vcgezq_v((int8x16_t)__rev0, 49); 46668 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 46669 return __ret; 46670 } 46671 #endif 46672 46673 #ifdef __LITTLE_ENDIAN__ 46674 __ai __attribute__((target("neon"))) uint8x8_t vcgez_s8(int8x8_t __p0) { 46675 uint8x8_t __ret; 46676 __ret = (uint8x8_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 16); 46677 return __ret; 46678 } 46679 #else 46680 __ai __attribute__((target("neon"))) uint8x8_t vcgez_s8(int8x8_t __p0) { 46681 uint8x8_t __ret; 46682 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46683 __ret = (uint8x8_t) __builtin_neon_vcgez_v((int8x8_t)__rev0, 16); 46684 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 46685 return __ret; 46686 } 46687 #endif 46688 46689 __ai __attribute__((target("neon"))) uint64x1_t vcgez_f64(float64x1_t __p0) { 46690 uint64x1_t __ret; 46691 __ret = (uint64x1_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 19); 46692 return __ret; 46693 } 46694 #ifdef __LITTLE_ENDIAN__ 46695 __ai __attribute__((target("neon"))) uint32x2_t vcgez_f32(float32x2_t __p0) { 46696 uint32x2_t __ret; 46697 __ret = 
(uint32x2_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 18); 46698 return __ret; 46699 } 46700 #else 46701 __ai __attribute__((target("neon"))) uint32x2_t vcgez_f32(float32x2_t __p0) { 46702 uint32x2_t __ret; 46703 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46704 __ret = (uint32x2_t) __builtin_neon_vcgez_v((int8x8_t)__rev0, 18); 46705 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46706 return __ret; 46707 } 46708 #endif 46709 46710 #ifdef __LITTLE_ENDIAN__ 46711 __ai __attribute__((target("neon"))) uint32x2_t vcgez_s32(int32x2_t __p0) { 46712 uint32x2_t __ret; 46713 __ret = (uint32x2_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 18); 46714 return __ret; 46715 } 46716 #else 46717 __ai __attribute__((target("neon"))) uint32x2_t vcgez_s32(int32x2_t __p0) { 46718 uint32x2_t __ret; 46719 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46720 __ret = (uint32x2_t) __builtin_neon_vcgez_v((int8x8_t)__rev0, 18); 46721 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46722 return __ret; 46723 } 46724 #endif 46725 46726 __ai __attribute__((target("neon"))) uint64x1_t vcgez_s64(int64x1_t __p0) { 46727 uint64x1_t __ret; 46728 __ret = (uint64x1_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 19); 46729 return __ret; 46730 } 46731 #ifdef __LITTLE_ENDIAN__ 46732 __ai __attribute__((target("neon"))) uint16x4_t vcgez_s16(int16x4_t __p0) { 46733 uint16x4_t __ret; 46734 __ret = (uint16x4_t) __builtin_neon_vcgez_v((int8x8_t)__p0, 17); 46735 return __ret; 46736 } 46737 #else 46738 __ai __attribute__((target("neon"))) uint16x4_t vcgez_s16(int16x4_t __p0) { 46739 uint16x4_t __ret; 46740 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46741 __ret = (uint16x4_t) __builtin_neon_vcgez_v((int8x8_t)__rev0, 17); 46742 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46743 return __ret; 46744 } 46745 #endif 46746 46747 __ai __attribute__((target("neon"))) uint64_t vcgezd_s64(int64_t __p0) { 46748 uint64_t __ret; 
46749 __ret = (uint64_t) __builtin_neon_vcgezd_s64(__p0); 46750 return __ret; 46751 } 46752 __ai __attribute__((target("neon"))) uint64_t vcgezd_f64(float64_t __p0) { 46753 uint64_t __ret; 46754 __ret = (uint64_t) __builtin_neon_vcgezd_f64(__p0); 46755 return __ret; 46756 } 46757 __ai __attribute__((target("neon"))) uint32_t vcgezs_f32(float32_t __p0) { 46758 uint32_t __ret; 46759 __ret = (uint32_t) __builtin_neon_vcgezs_f32(__p0); 46760 return __ret; 46761 } 46762 #ifdef __LITTLE_ENDIAN__ 46763 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_u64(uint64x2_t __p0, uint64x2_t __p1) { 46764 uint64x2_t __ret; 46765 __ret = (uint64x2_t)(__p0 > __p1); 46766 return __ret; 46767 } 46768 #else 46769 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_u64(uint64x2_t __p0, uint64x2_t __p1) { 46770 uint64x2_t __ret; 46771 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46772 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46773 __ret = (uint64x2_t)(__rev0 > __rev1); 46774 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46775 return __ret; 46776 } 46777 #endif 46778 46779 #ifdef __LITTLE_ENDIAN__ 46780 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_f64(float64x2_t __p0, float64x2_t __p1) { 46781 uint64x2_t __ret; 46782 __ret = (uint64x2_t)(__p0 > __p1); 46783 return __ret; 46784 } 46785 #else 46786 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_f64(float64x2_t __p0, float64x2_t __p1) { 46787 uint64x2_t __ret; 46788 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46789 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46790 __ret = (uint64x2_t)(__rev0 > __rev1); 46791 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46792 return __ret; 46793 } 46794 #endif 46795 46796 #ifdef __LITTLE_ENDIAN__ 46797 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_s64(int64x2_t __p0, int64x2_t __p1) { 46798 uint64x2_t __ret; 46799 __ret = (uint64x2_t)(__p0 > __p1); 46800 
return __ret; 46801 } 46802 #else 46803 __ai __attribute__((target("neon"))) uint64x2_t vcgtq_s64(int64x2_t __p0, int64x2_t __p1) { 46804 uint64x2_t __ret; 46805 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46806 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 46807 __ret = (uint64x2_t)(__rev0 > __rev1); 46808 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46809 return __ret; 46810 } 46811 #endif 46812 46813 __ai __attribute__((target("neon"))) uint64x1_t vcgt_u64(uint64x1_t __p0, uint64x1_t __p1) { 46814 uint64x1_t __ret; 46815 __ret = (uint64x1_t)(__p0 > __p1); 46816 return __ret; 46817 } 46818 __ai __attribute__((target("neon"))) uint64x1_t vcgt_f64(float64x1_t __p0, float64x1_t __p1) { 46819 uint64x1_t __ret; 46820 __ret = (uint64x1_t)(__p0 > __p1); 46821 return __ret; 46822 } 46823 __ai __attribute__((target("neon"))) uint64x1_t vcgt_s64(int64x1_t __p0, int64x1_t __p1) { 46824 uint64x1_t __ret; 46825 __ret = (uint64x1_t)(__p0 > __p1); 46826 return __ret; 46827 } 46828 __ai __attribute__((target("neon"))) uint64_t vcgtd_s64(int64_t __p0, int64_t __p1) { 46829 uint64_t __ret; 46830 __ret = (uint64_t) __builtin_neon_vcgtd_s64(__p0, __p1); 46831 return __ret; 46832 } 46833 __ai __attribute__((target("neon"))) uint64_t vcgtd_u64(uint64_t __p0, uint64_t __p1) { 46834 uint64_t __ret; 46835 __ret = (uint64_t) __builtin_neon_vcgtd_u64(__p0, __p1); 46836 return __ret; 46837 } 46838 __ai __attribute__((target("neon"))) uint64_t vcgtd_f64(float64_t __p0, float64_t __p1) { 46839 uint64_t __ret; 46840 __ret = (uint64_t) __builtin_neon_vcgtd_f64(__p0, __p1); 46841 return __ret; 46842 } 46843 __ai __attribute__((target("neon"))) uint32_t vcgts_f32(float32_t __p0, float32_t __p1) { 46844 uint32_t __ret; 46845 __ret = (uint32_t) __builtin_neon_vcgts_f32(__p0, __p1); 46846 return __ret; 46847 } 46848 #ifdef __LITTLE_ENDIAN__ 46849 __ai __attribute__((target("neon"))) uint8x16_t vcgtzq_s8(int8x16_t __p0) { 46850 uint8x16_t 
__ret; 46851 __ret = (uint8x16_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 48); 46852 return __ret; 46853 } 46854 #else 46855 __ai __attribute__((target("neon"))) uint8x16_t vcgtzq_s8(int8x16_t __p0) { 46856 uint8x16_t __ret; 46857 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46858 __ret = (uint8x16_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 48); 46859 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 46860 return __ret; 46861 } 46862 #endif 46863 46864 #ifdef __LITTLE_ENDIAN__ 46865 __ai __attribute__((target("neon"))) uint64x2_t vcgtzq_f64(float64x2_t __p0) { 46866 uint64x2_t __ret; 46867 __ret = (uint64x2_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 51); 46868 return __ret; 46869 } 46870 #else 46871 __ai __attribute__((target("neon"))) uint64x2_t vcgtzq_f64(float64x2_t __p0) { 46872 uint64x2_t __ret; 46873 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46874 __ret = (uint64x2_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 51); 46875 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46876 return __ret; 46877 } 46878 #endif 46879 46880 #ifdef __LITTLE_ENDIAN__ 46881 __ai __attribute__((target("neon"))) uint32x4_t vcgtzq_f32(float32x4_t __p0) { 46882 uint32x4_t __ret; 46883 __ret = (uint32x4_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 50); 46884 return __ret; 46885 } 46886 #else 46887 __ai __attribute__((target("neon"))) uint32x4_t vcgtzq_f32(float32x4_t __p0) { 46888 uint32x4_t __ret; 46889 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46890 __ret = (uint32x4_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 50); 46891 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46892 return __ret; 46893 } 46894 #endif 46895 46896 #ifdef __LITTLE_ENDIAN__ 46897 __ai __attribute__((target("neon"))) uint32x4_t vcgtzq_s32(int32x4_t __p0) { 46898 uint32x4_t __ret; 46899 __ret = (uint32x4_t) 
__builtin_neon_vcgtzq_v((int8x16_t)__p0, 50); 46900 return __ret; 46901 } 46902 #else 46903 __ai __attribute__((target("neon"))) uint32x4_t vcgtzq_s32(int32x4_t __p0) { 46904 uint32x4_t __ret; 46905 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 46906 __ret = (uint32x4_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 50); 46907 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 46908 return __ret; 46909 } 46910 #endif 46911 46912 #ifdef __LITTLE_ENDIAN__ 46913 __ai __attribute__((target("neon"))) uint64x2_t vcgtzq_s64(int64x2_t __p0) { 46914 uint64x2_t __ret; 46915 __ret = (uint64x2_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 51); 46916 return __ret; 46917 } 46918 #else 46919 __ai __attribute__((target("neon"))) uint64x2_t vcgtzq_s64(int64x2_t __p0) { 46920 uint64x2_t __ret; 46921 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46922 __ret = (uint64x2_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 51); 46923 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46924 return __ret; 46925 } 46926 #endif 46927 46928 #ifdef __LITTLE_ENDIAN__ 46929 __ai __attribute__((target("neon"))) uint16x8_t vcgtzq_s16(int16x8_t __p0) { 46930 uint16x8_t __ret; 46931 __ret = (uint16x8_t) __builtin_neon_vcgtzq_v((int8x16_t)__p0, 49); 46932 return __ret; 46933 } 46934 #else 46935 __ai __attribute__((target("neon"))) uint16x8_t vcgtzq_s16(int16x8_t __p0) { 46936 uint16x8_t __ret; 46937 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46938 __ret = (uint16x8_t) __builtin_neon_vcgtzq_v((int8x16_t)__rev0, 49); 46939 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 46940 return __ret; 46941 } 46942 #endif 46943 46944 #ifdef __LITTLE_ENDIAN__ 46945 __ai __attribute__((target("neon"))) uint8x8_t vcgtz_s8(int8x8_t __p0) { 46946 uint8x8_t __ret; 46947 __ret = (uint8x8_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 16); 46948 return __ret; 46949 } 46950 #else 46951 __ai 
__attribute__((target("neon"))) uint8x8_t vcgtz_s8(int8x8_t __p0) { 46952 uint8x8_t __ret; 46953 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 46954 __ret = (uint8x8_t) __builtin_neon_vcgtz_v((int8x8_t)__rev0, 16); 46955 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 46956 return __ret; 46957 } 46958 #endif 46959 46960 __ai __attribute__((target("neon"))) uint64x1_t vcgtz_f64(float64x1_t __p0) { 46961 uint64x1_t __ret; 46962 __ret = (uint64x1_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 19); 46963 return __ret; 46964 } 46965 #ifdef __LITTLE_ENDIAN__ 46966 __ai __attribute__((target("neon"))) uint32x2_t vcgtz_f32(float32x2_t __p0) { 46967 uint32x2_t __ret; 46968 __ret = (uint32x2_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 18); 46969 return __ret; 46970 } 46971 #else 46972 __ai __attribute__((target("neon"))) uint32x2_t vcgtz_f32(float32x2_t __p0) { 46973 uint32x2_t __ret; 46974 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46975 __ret = (uint32x2_t) __builtin_neon_vcgtz_v((int8x8_t)__rev0, 18); 46976 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46977 return __ret; 46978 } 46979 #endif 46980 46981 #ifdef __LITTLE_ENDIAN__ 46982 __ai __attribute__((target("neon"))) uint32x2_t vcgtz_s32(int32x2_t __p0) { 46983 uint32x2_t __ret; 46984 __ret = (uint32x2_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 18); 46985 return __ret; 46986 } 46987 #else 46988 __ai __attribute__((target("neon"))) uint32x2_t vcgtz_s32(int32x2_t __p0) { 46989 uint32x2_t __ret; 46990 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 46991 __ret = (uint32x2_t) __builtin_neon_vcgtz_v((int8x8_t)__rev0, 18); 46992 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 46993 return __ret; 46994 } 46995 #endif 46996 46997 __ai __attribute__((target("neon"))) uint64x1_t vcgtz_s64(int64x1_t __p0) { 46998 uint64x1_t __ret; 46999 __ret = (uint64x1_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 19); 47000 
return __ret; 47001 } 47002 #ifdef __LITTLE_ENDIAN__ 47003 __ai __attribute__((target("neon"))) uint16x4_t vcgtz_s16(int16x4_t __p0) { 47004 uint16x4_t __ret; 47005 __ret = (uint16x4_t) __builtin_neon_vcgtz_v((int8x8_t)__p0, 17); 47006 return __ret; 47007 } 47008 #else 47009 __ai __attribute__((target("neon"))) uint16x4_t vcgtz_s16(int16x4_t __p0) { 47010 uint16x4_t __ret; 47011 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 47012 __ret = (uint16x4_t) __builtin_neon_vcgtz_v((int8x8_t)__rev0, 17); 47013 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 47014 return __ret; 47015 } 47016 #endif 47017 47018 __ai __attribute__((target("neon"))) uint64_t vcgtzd_s64(int64_t __p0) { 47019 uint64_t __ret; 47020 __ret = (uint64_t) __builtin_neon_vcgtzd_s64(__p0); 47021 return __ret; 47022 } 47023 __ai __attribute__((target("neon"))) uint64_t vcgtzd_f64(float64_t __p0) { 47024 uint64_t __ret; 47025 __ret = (uint64_t) __builtin_neon_vcgtzd_f64(__p0); 47026 return __ret; 47027 } 47028 __ai __attribute__((target("neon"))) uint32_t vcgtzs_f32(float32_t __p0) { 47029 uint32_t __ret; 47030 __ret = (uint32_t) __builtin_neon_vcgtzs_f32(__p0); 47031 return __ret; 47032 } 47033 #ifdef __LITTLE_ENDIAN__ 47034 __ai __attribute__((target("neon"))) uint64x2_t vcleq_u64(uint64x2_t __p0, uint64x2_t __p1) { 47035 uint64x2_t __ret; 47036 __ret = (uint64x2_t)(__p0 <= __p1); 47037 return __ret; 47038 } 47039 #else 47040 __ai __attribute__((target("neon"))) uint64x2_t vcleq_u64(uint64x2_t __p0, uint64x2_t __p1) { 47041 uint64x2_t __ret; 47042 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47043 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 47044 __ret = (uint64x2_t)(__rev0 <= __rev1); 47045 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47046 return __ret; 47047 } 47048 #endif 47049 47050 #ifdef __LITTLE_ENDIAN__ 47051 __ai __attribute__((target("neon"))) uint64x2_t vcleq_f64(float64x2_t __p0, float64x2_t 
__p1) { 47052 uint64x2_t __ret; 47053 __ret = (uint64x2_t)(__p0 <= __p1); 47054 return __ret; 47055 } 47056 #else 47057 __ai __attribute__((target("neon"))) uint64x2_t vcleq_f64(float64x2_t __p0, float64x2_t __p1) { 47058 uint64x2_t __ret; 47059 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47060 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 47061 __ret = (uint64x2_t)(__rev0 <= __rev1); 47062 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47063 return __ret; 47064 } 47065 #endif 47066 47067 #ifdef __LITTLE_ENDIAN__ 47068 __ai __attribute__((target("neon"))) uint64x2_t vcleq_s64(int64x2_t __p0, int64x2_t __p1) { 47069 uint64x2_t __ret; 47070 __ret = (uint64x2_t)(__p0 <= __p1); 47071 return __ret; 47072 } 47073 #else 47074 __ai __attribute__((target("neon"))) uint64x2_t vcleq_s64(int64x2_t __p0, int64x2_t __p1) { 47075 uint64x2_t __ret; 47076 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47077 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 47078 __ret = (uint64x2_t)(__rev0 <= __rev1); 47079 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47080 return __ret; 47081 } 47082 #endif 47083 47084 __ai __attribute__((target("neon"))) uint64x1_t vcle_u64(uint64x1_t __p0, uint64x1_t __p1) { 47085 uint64x1_t __ret; 47086 __ret = (uint64x1_t)(__p0 <= __p1); 47087 return __ret; 47088 } 47089 __ai __attribute__((target("neon"))) uint64x1_t vcle_f64(float64x1_t __p0, float64x1_t __p1) { 47090 uint64x1_t __ret; 47091 __ret = (uint64x1_t)(__p0 <= __p1); 47092 return __ret; 47093 } 47094 __ai __attribute__((target("neon"))) uint64x1_t vcle_s64(int64x1_t __p0, int64x1_t __p1) { 47095 uint64x1_t __ret; 47096 __ret = (uint64x1_t)(__p0 <= __p1); 47097 return __ret; 47098 } 47099 __ai __attribute__((target("neon"))) uint64_t vcled_u64(uint64_t __p0, uint64_t __p1) { 47100 uint64_t __ret; 47101 __ret = (uint64_t) __builtin_neon_vcled_u64(__p0, __p1); 47102 return __ret; 47103 } 
47104 __ai __attribute__((target("neon"))) uint64_t vcled_s64(int64_t __p0, int64_t __p1) { 47105 uint64_t __ret; 47106 __ret = (uint64_t) __builtin_neon_vcled_s64(__p0, __p1); 47107 return __ret; 47108 } 47109 __ai __attribute__((target("neon"))) uint64_t vcled_f64(float64_t __p0, float64_t __p1) { 47110 uint64_t __ret; 47111 __ret = (uint64_t) __builtin_neon_vcled_f64(__p0, __p1); 47112 return __ret; 47113 } 47114 __ai __attribute__((target("neon"))) uint32_t vcles_f32(float32_t __p0, float32_t __p1) { 47115 uint32_t __ret; 47116 __ret = (uint32_t) __builtin_neon_vcles_f32(__p0, __p1); 47117 return __ret; 47118 } 47119 #ifdef __LITTLE_ENDIAN__ 47120 __ai __attribute__((target("neon"))) uint8x16_t vclezq_s8(int8x16_t __p0) { 47121 uint8x16_t __ret; 47122 __ret = (uint8x16_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 48); 47123 return __ret; 47124 } 47125 #else 47126 __ai __attribute__((target("neon"))) uint8x16_t vclezq_s8(int8x16_t __p0) { 47127 uint8x16_t __ret; 47128 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 47129 __ret = (uint8x16_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 48); 47130 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 47131 return __ret; 47132 } 47133 #endif 47134 47135 #ifdef __LITTLE_ENDIAN__ 47136 __ai __attribute__((target("neon"))) uint64x2_t vclezq_f64(float64x2_t __p0) { 47137 uint64x2_t __ret; 47138 __ret = (uint64x2_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 51); 47139 return __ret; 47140 } 47141 #else 47142 __ai __attribute__((target("neon"))) uint64x2_t vclezq_f64(float64x2_t __p0) { 47143 uint64x2_t __ret; 47144 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47145 __ret = (uint64x2_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 51); 47146 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47147 return __ret; 47148 } 47149 #endif 47150 47151 #ifdef __LITTLE_ENDIAN__ 47152 __ai 
__attribute__((target("neon"))) uint32x4_t vclezq_f32(float32x4_t __p0) { 47153 uint32x4_t __ret; 47154 __ret = (uint32x4_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 50); 47155 return __ret; 47156 } 47157 #else 47158 __ai __attribute__((target("neon"))) uint32x4_t vclezq_f32(float32x4_t __p0) { 47159 uint32x4_t __ret; 47160 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 47161 __ret = (uint32x4_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 50); 47162 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 47163 return __ret; 47164 } 47165 #endif 47166 47167 #ifdef __LITTLE_ENDIAN__ 47168 __ai __attribute__((target("neon"))) uint32x4_t vclezq_s32(int32x4_t __p0) { 47169 uint32x4_t __ret; 47170 __ret = (uint32x4_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 50); 47171 return __ret; 47172 } 47173 #else 47174 __ai __attribute__((target("neon"))) uint32x4_t vclezq_s32(int32x4_t __p0) { 47175 uint32x4_t __ret; 47176 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 47177 __ret = (uint32x4_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 50); 47178 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 47179 return __ret; 47180 } 47181 #endif 47182 47183 #ifdef __LITTLE_ENDIAN__ 47184 __ai __attribute__((target("neon"))) uint64x2_t vclezq_s64(int64x2_t __p0) { 47185 uint64x2_t __ret; 47186 __ret = (uint64x2_t) __builtin_neon_vclezq_v((int8x16_t)__p0, 51); 47187 return __ret; 47188 } 47189 #else 47190 __ai __attribute__((target("neon"))) uint64x2_t vclezq_s64(int64x2_t __p0) { 47191 uint64x2_t __ret; 47192 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47193 __ret = (uint64x2_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 51); 47194 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47195 return __ret; 47196 } 47197 #endif 47198 47199 #ifdef __LITTLE_ENDIAN__ 47200 __ai __attribute__((target("neon"))) uint16x8_t vclezq_s16(int16x8_t __p0) { 47201 uint16x8_t __ret; 47202 __ret = (uint16x8_t) 
__builtin_neon_vclezq_v((int8x16_t)__p0, 49); 47203 return __ret; 47204 } 47205 #else 47206 __ai __attribute__((target("neon"))) uint16x8_t vclezq_s16(int16x8_t __p0) { 47207 uint16x8_t __ret; 47208 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 47209 __ret = (uint16x8_t) __builtin_neon_vclezq_v((int8x16_t)__rev0, 49); 47210 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 47211 return __ret; 47212 } 47213 #endif 47214 47215 #ifdef __LITTLE_ENDIAN__ 47216 __ai __attribute__((target("neon"))) uint8x8_t vclez_s8(int8x8_t __p0) { 47217 uint8x8_t __ret; 47218 __ret = (uint8x8_t) __builtin_neon_vclez_v((int8x8_t)__p0, 16); 47219 return __ret; 47220 } 47221 #else 47222 __ai __attribute__((target("neon"))) uint8x8_t vclez_s8(int8x8_t __p0) { 47223 uint8x8_t __ret; 47224 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 47225 __ret = (uint8x8_t) __builtin_neon_vclez_v((int8x8_t)__rev0, 16); 47226 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 47227 return __ret; 47228 } 47229 #endif 47230 47231 __ai __attribute__((target("neon"))) uint64x1_t vclez_f64(float64x1_t __p0) { 47232 uint64x1_t __ret; 47233 __ret = (uint64x1_t) __builtin_neon_vclez_v((int8x8_t)__p0, 19); 47234 return __ret; 47235 } 47236 #ifdef __LITTLE_ENDIAN__ 47237 __ai __attribute__((target("neon"))) uint32x2_t vclez_f32(float32x2_t __p0) { 47238 uint32x2_t __ret; 47239 __ret = (uint32x2_t) __builtin_neon_vclez_v((int8x8_t)__p0, 18); 47240 return __ret; 47241 } 47242 #else 47243 __ai __attribute__((target("neon"))) uint32x2_t vclez_f32(float32x2_t __p0) { 47244 uint32x2_t __ret; 47245 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47246 __ret = (uint32x2_t) __builtin_neon_vclez_v((int8x8_t)__rev0, 18); 47247 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47248 return __ret; 47249 } 47250 #endif 47251 47252 #ifdef __LITTLE_ENDIAN__ 47253 __ai 
__attribute__((target("neon"))) uint32x2_t vclez_s32(int32x2_t __p0) { 47254 uint32x2_t __ret; 47255 __ret = (uint32x2_t) __builtin_neon_vclez_v((int8x8_t)__p0, 18); 47256 return __ret; 47257 } 47258 #else 47259 __ai __attribute__((target("neon"))) uint32x2_t vclez_s32(int32x2_t __p0) { 47260 uint32x2_t __ret; 47261 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47262 __ret = (uint32x2_t) __builtin_neon_vclez_v((int8x8_t)__rev0, 18); 47263 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47264 return __ret; 47265 } 47266 #endif 47267 47268 __ai __attribute__((target("neon"))) uint64x1_t vclez_s64(int64x1_t __p0) { 47269 uint64x1_t __ret; 47270 __ret = (uint64x1_t) __builtin_neon_vclez_v((int8x8_t)__p0, 19); 47271 return __ret; 47272 } 47273 #ifdef __LITTLE_ENDIAN__ 47274 __ai __attribute__((target("neon"))) uint16x4_t vclez_s16(int16x4_t __p0) { 47275 uint16x4_t __ret; 47276 __ret = (uint16x4_t) __builtin_neon_vclez_v((int8x8_t)__p0, 17); 47277 return __ret; 47278 } 47279 #else 47280 __ai __attribute__((target("neon"))) uint16x4_t vclez_s16(int16x4_t __p0) { 47281 uint16x4_t __ret; 47282 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 47283 __ret = (uint16x4_t) __builtin_neon_vclez_v((int8x8_t)__rev0, 17); 47284 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 47285 return __ret; 47286 } 47287 #endif 47288 47289 __ai __attribute__((target("neon"))) uint64_t vclezd_s64(int64_t __p0) { 47290 uint64_t __ret; 47291 __ret = (uint64_t) __builtin_neon_vclezd_s64(__p0); 47292 return __ret; 47293 } 47294 __ai __attribute__((target("neon"))) uint64_t vclezd_f64(float64_t __p0) { 47295 uint64_t __ret; 47296 __ret = (uint64_t) __builtin_neon_vclezd_f64(__p0); 47297 return __ret; 47298 } 47299 __ai __attribute__((target("neon"))) uint32_t vclezs_f32(float32_t __p0) { 47300 uint32_t __ret; 47301 __ret = (uint32_t) __builtin_neon_vclezs_f32(__p0); 47302 return __ret; 47303 } 47304 #ifdef __LITTLE_ENDIAN__ 47305 __ai 
__attribute__((target("neon"))) uint64x2_t vcltq_u64(uint64x2_t __p0, uint64x2_t __p1) { 47306 uint64x2_t __ret; 47307 __ret = (uint64x2_t)(__p0 < __p1); 47308 return __ret; 47309 } 47310 #else 47311 __ai __attribute__((target("neon"))) uint64x2_t vcltq_u64(uint64x2_t __p0, uint64x2_t __p1) { 47312 uint64x2_t __ret; 47313 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47314 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 47315 __ret = (uint64x2_t)(__rev0 < __rev1); 47316 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47317 return __ret; 47318 } 47319 #endif 47320 47321 #ifdef __LITTLE_ENDIAN__ 47322 __ai __attribute__((target("neon"))) uint64x2_t vcltq_f64(float64x2_t __p0, float64x2_t __p1) { 47323 uint64x2_t __ret; 47324 __ret = (uint64x2_t)(__p0 < __p1); 47325 return __ret; 47326 } 47327 #else 47328 __ai __attribute__((target("neon"))) uint64x2_t vcltq_f64(float64x2_t __p0, float64x2_t __p1) { 47329 uint64x2_t __ret; 47330 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47331 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 47332 __ret = (uint64x2_t)(__rev0 < __rev1); 47333 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47334 return __ret; 47335 } 47336 #endif 47337 47338 #ifdef __LITTLE_ENDIAN__ 47339 __ai __attribute__((target("neon"))) uint64x2_t vcltq_s64(int64x2_t __p0, int64x2_t __p1) { 47340 uint64x2_t __ret; 47341 __ret = (uint64x2_t)(__p0 < __p1); 47342 return __ret; 47343 } 47344 #else 47345 __ai __attribute__((target("neon"))) uint64x2_t vcltq_s64(int64x2_t __p0, int64x2_t __p1) { 47346 uint64x2_t __ret; 47347 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47348 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 47349 __ret = (uint64x2_t)(__rev0 < __rev1); 47350 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47351 return __ret; 47352 } 47353 #endif 47354 47355 __ai __attribute__((target("neon"))) 
uint64x1_t vclt_u64(uint64x1_t __p0, uint64x1_t __p1) { 47356 uint64x1_t __ret; 47357 __ret = (uint64x1_t)(__p0 < __p1); 47358 return __ret; 47359 } 47360 __ai __attribute__((target("neon"))) uint64x1_t vclt_f64(float64x1_t __p0, float64x1_t __p1) { 47361 uint64x1_t __ret; 47362 __ret = (uint64x1_t)(__p0 < __p1); 47363 return __ret; 47364 } 47365 __ai __attribute__((target("neon"))) uint64x1_t vclt_s64(int64x1_t __p0, int64x1_t __p1) { 47366 uint64x1_t __ret; 47367 __ret = (uint64x1_t)(__p0 < __p1); 47368 return __ret; 47369 } 47370 __ai __attribute__((target("neon"))) uint64_t vcltd_u64(uint64_t __p0, uint64_t __p1) { 47371 uint64_t __ret; 47372 __ret = (uint64_t) __builtin_neon_vcltd_u64(__p0, __p1); 47373 return __ret; 47374 } 47375 __ai __attribute__((target("neon"))) uint64_t vcltd_s64(int64_t __p0, int64_t __p1) { 47376 uint64_t __ret; 47377 __ret = (uint64_t) __builtin_neon_vcltd_s64(__p0, __p1); 47378 return __ret; 47379 } 47380 __ai __attribute__((target("neon"))) uint64_t vcltd_f64(float64_t __p0, float64_t __p1) { 47381 uint64_t __ret; 47382 __ret = (uint64_t) __builtin_neon_vcltd_f64(__p0, __p1); 47383 return __ret; 47384 } 47385 __ai __attribute__((target("neon"))) uint32_t vclts_f32(float32_t __p0, float32_t __p1) { 47386 uint32_t __ret; 47387 __ret = (uint32_t) __builtin_neon_vclts_f32(__p0, __p1); 47388 return __ret; 47389 } 47390 #ifdef __LITTLE_ENDIAN__ 47391 __ai __attribute__((target("neon"))) uint8x16_t vcltzq_s8(int8x16_t __p0) { 47392 uint8x16_t __ret; 47393 __ret = (uint8x16_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 48); 47394 return __ret; 47395 } 47396 #else 47397 __ai __attribute__((target("neon"))) uint8x16_t vcltzq_s8(int8x16_t __p0) { 47398 uint8x16_t __ret; 47399 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 47400 __ret = (uint8x16_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 48); 47401 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 
7, 6, 5, 4, 3, 2, 1, 0); 47402 return __ret; 47403 } 47404 #endif 47405 47406 #ifdef __LITTLE_ENDIAN__ 47407 __ai __attribute__((target("neon"))) uint64x2_t vcltzq_f64(float64x2_t __p0) { 47408 uint64x2_t __ret; 47409 __ret = (uint64x2_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 51); 47410 return __ret; 47411 } 47412 #else 47413 __ai __attribute__((target("neon"))) uint64x2_t vcltzq_f64(float64x2_t __p0) { 47414 uint64x2_t __ret; 47415 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47416 __ret = (uint64x2_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 51); 47417 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47418 return __ret; 47419 } 47420 #endif 47421 47422 #ifdef __LITTLE_ENDIAN__ 47423 __ai __attribute__((target("neon"))) uint32x4_t vcltzq_f32(float32x4_t __p0) { 47424 uint32x4_t __ret; 47425 __ret = (uint32x4_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 50); 47426 return __ret; 47427 } 47428 #else 47429 __ai __attribute__((target("neon"))) uint32x4_t vcltzq_f32(float32x4_t __p0) { 47430 uint32x4_t __ret; 47431 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 47432 __ret = (uint32x4_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 50); 47433 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 47434 return __ret; 47435 } 47436 #endif 47437 47438 #ifdef __LITTLE_ENDIAN__ 47439 __ai __attribute__((target("neon"))) uint32x4_t vcltzq_s32(int32x4_t __p0) { 47440 uint32x4_t __ret; 47441 __ret = (uint32x4_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 50); 47442 return __ret; 47443 } 47444 #else 47445 __ai __attribute__((target("neon"))) uint32x4_t vcltzq_s32(int32x4_t __p0) { 47446 uint32x4_t __ret; 47447 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 47448 __ret = (uint32x4_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 50); 47449 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 47450 return __ret; 47451 } 47452 #endif 47453 47454 #ifdef __LITTLE_ENDIAN__ 47455 __ai 
__attribute__((target("neon"))) uint64x2_t vcltzq_s64(int64x2_t __p0) { 47456 uint64x2_t __ret; 47457 __ret = (uint64x2_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 51); 47458 return __ret; 47459 } 47460 #else 47461 __ai __attribute__((target("neon"))) uint64x2_t vcltzq_s64(int64x2_t __p0) { 47462 uint64x2_t __ret; 47463 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47464 __ret = (uint64x2_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 51); 47465 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47466 return __ret; 47467 } 47468 #endif 47469 47470 #ifdef __LITTLE_ENDIAN__ 47471 __ai __attribute__((target("neon"))) uint16x8_t vcltzq_s16(int16x8_t __p0) { 47472 uint16x8_t __ret; 47473 __ret = (uint16x8_t) __builtin_neon_vcltzq_v((int8x16_t)__p0, 49); 47474 return __ret; 47475 } 47476 #else 47477 __ai __attribute__((target("neon"))) uint16x8_t vcltzq_s16(int16x8_t __p0) { 47478 uint16x8_t __ret; 47479 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 47480 __ret = (uint16x8_t) __builtin_neon_vcltzq_v((int8x16_t)__rev0, 49); 47481 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 47482 return __ret; 47483 } 47484 #endif 47485 47486 #ifdef __LITTLE_ENDIAN__ 47487 __ai __attribute__((target("neon"))) uint8x8_t vcltz_s8(int8x8_t __p0) { 47488 uint8x8_t __ret; 47489 __ret = (uint8x8_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 16); 47490 return __ret; 47491 } 47492 #else 47493 __ai __attribute__((target("neon"))) uint8x8_t vcltz_s8(int8x8_t __p0) { 47494 uint8x8_t __ret; 47495 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 47496 __ret = (uint8x8_t) __builtin_neon_vcltz_v((int8x8_t)__rev0, 16); 47497 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 47498 return __ret; 47499 } 47500 #endif 47501 47502 __ai __attribute__((target("neon"))) uint64x1_t vcltz_f64(float64x1_t __p0) { 47503 uint64x1_t __ret; 47504 __ret = (uint64x1_t) 
__builtin_neon_vcltz_v((int8x8_t)__p0, 19); 47505 return __ret; 47506 } 47507 #ifdef __LITTLE_ENDIAN__ 47508 __ai __attribute__((target("neon"))) uint32x2_t vcltz_f32(float32x2_t __p0) { 47509 uint32x2_t __ret; 47510 __ret = (uint32x2_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 18); 47511 return __ret; 47512 } 47513 #else 47514 __ai __attribute__((target("neon"))) uint32x2_t vcltz_f32(float32x2_t __p0) { 47515 uint32x2_t __ret; 47516 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47517 __ret = (uint32x2_t) __builtin_neon_vcltz_v((int8x8_t)__rev0, 18); 47518 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47519 return __ret; 47520 } 47521 #endif 47522 47523 #ifdef __LITTLE_ENDIAN__ 47524 __ai __attribute__((target("neon"))) uint32x2_t vcltz_s32(int32x2_t __p0) { 47525 uint32x2_t __ret; 47526 __ret = (uint32x2_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 18); 47527 return __ret; 47528 } 47529 #else 47530 __ai __attribute__((target("neon"))) uint32x2_t vcltz_s32(int32x2_t __p0) { 47531 uint32x2_t __ret; 47532 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 47533 __ret = (uint32x2_t) __builtin_neon_vcltz_v((int8x8_t)__rev0, 18); 47534 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47535 return __ret; 47536 } 47537 #endif 47538 47539 __ai __attribute__((target("neon"))) uint64x1_t vcltz_s64(int64x1_t __p0) { 47540 uint64x1_t __ret; 47541 __ret = (uint64x1_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 19); 47542 return __ret; 47543 } 47544 #ifdef __LITTLE_ENDIAN__ 47545 __ai __attribute__((target("neon"))) uint16x4_t vcltz_s16(int16x4_t __p0) { 47546 uint16x4_t __ret; 47547 __ret = (uint16x4_t) __builtin_neon_vcltz_v((int8x8_t)__p0, 17); 47548 return __ret; 47549 } 47550 #else 47551 __ai __attribute__((target("neon"))) uint16x4_t vcltz_s16(int16x4_t __p0) { 47552 uint16x4_t __ret; 47553 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 47554 __ret = (uint16x4_t) 
__builtin_neon_vcltz_v((int8x8_t)__rev0, 17); 47555 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 47556 return __ret; 47557 } 47558 #endif 47559 47560 __ai __attribute__((target("neon"))) uint64_t vcltzd_s64(int64_t __p0) { 47561 uint64_t __ret; 47562 __ret = (uint64_t) __builtin_neon_vcltzd_s64(__p0); 47563 return __ret; 47564 } 47565 __ai __attribute__((target("neon"))) uint64_t vcltzd_f64(float64_t __p0) { 47566 uint64_t __ret; 47567 __ret = (uint64_t) __builtin_neon_vcltzd_f64(__p0); 47568 return __ret; 47569 } 47570 __ai __attribute__((target("neon"))) uint32_t vcltzs_f32(float32_t __p0) { 47571 uint32_t __ret; 47572 __ret = (uint32_t) __builtin_neon_vcltzs_f32(__p0); 47573 return __ret; 47574 } 47575 #ifdef __LITTLE_ENDIAN__ 47576 __ai __attribute__((target("neon"))) poly64x2_t vcombine_p64(poly64x1_t __p0, poly64x1_t __p1) { 47577 poly64x2_t __ret; 47578 __ret = __builtin_shufflevector(__p0, __p1, 0, 1); 47579 return __ret; 47580 } 47581 #else 47582 __ai __attribute__((target("neon"))) poly64x2_t vcombine_p64(poly64x1_t __p0, poly64x1_t __p1) { 47583 poly64x2_t __ret; 47584 __ret = __builtin_shufflevector(__p0, __p1, 0, 1); 47585 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47586 return __ret; 47587 } 47588 #endif 47589 47590 #ifdef __LITTLE_ENDIAN__ 47591 __ai __attribute__((target("neon"))) float64x2_t vcombine_f64(float64x1_t __p0, float64x1_t __p1) { 47592 float64x2_t __ret; 47593 __ret = __builtin_shufflevector(__p0, __p1, 0, 1); 47594 return __ret; 47595 } 47596 #else 47597 __ai __attribute__((target("neon"))) float64x2_t vcombine_f64(float64x1_t __p0, float64x1_t __p1) { 47598 float64x2_t __ret; 47599 __ret = __builtin_shufflevector(__p0, __p1, 0, 1); 47600 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 47601 return __ret; 47602 } 47603 #endif 47604 47605 #ifdef __LITTLE_ENDIAN__ 47606 #define vcopyq_lane_p8(__p0_278, __p1_278, __p2_278, __p3_278) __extension__ ({ \ 47607 poly8x16_t __ret_278; \ 47608 poly8x16_t __s0_278 = 
__p0_278; \ 47609 poly8x8_t __s2_278 = __p2_278; \ 47610 __ret_278 = vsetq_lane_p8(vget_lane_p8(__s2_278, __p3_278), __s0_278, __p1_278); \ 47611 __ret_278; \ 47612 }) 47613 #else 47614 #define vcopyq_lane_p8(__p0_279, __p1_279, __p2_279, __p3_279) __extension__ ({ \ 47615 poly8x16_t __ret_279; \ 47616 poly8x16_t __s0_279 = __p0_279; \ 47617 poly8x8_t __s2_279 = __p2_279; \ 47618 poly8x16_t __rev0_279; __rev0_279 = __builtin_shufflevector(__s0_279, __s0_279, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 47619 poly8x8_t __rev2_279; __rev2_279 = __builtin_shufflevector(__s2_279, __s2_279, 7, 6, 5, 4, 3, 2, 1, 0); \ 47620 __ret_279 = __noswap_vsetq_lane_p8(__noswap_vget_lane_p8(__rev2_279, __p3_279), __rev0_279, __p1_279); \ 47621 __ret_279 = __builtin_shufflevector(__ret_279, __ret_279, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 47622 __ret_279; \ 47623 }) 47624 #endif 47625 47626 #ifdef __LITTLE_ENDIAN__ 47627 #define vcopyq_lane_p16(__p0_280, __p1_280, __p2_280, __p3_280) __extension__ ({ \ 47628 poly16x8_t __ret_280; \ 47629 poly16x8_t __s0_280 = __p0_280; \ 47630 poly16x4_t __s2_280 = __p2_280; \ 47631 __ret_280 = vsetq_lane_p16(vget_lane_p16(__s2_280, __p3_280), __s0_280, __p1_280); \ 47632 __ret_280; \ 47633 }) 47634 #else 47635 #define vcopyq_lane_p16(__p0_281, __p1_281, __p2_281, __p3_281) __extension__ ({ \ 47636 poly16x8_t __ret_281; \ 47637 poly16x8_t __s0_281 = __p0_281; \ 47638 poly16x4_t __s2_281 = __p2_281; \ 47639 poly16x8_t __rev0_281; __rev0_281 = __builtin_shufflevector(__s0_281, __s0_281, 7, 6, 5, 4, 3, 2, 1, 0); \ 47640 poly16x4_t __rev2_281; __rev2_281 = __builtin_shufflevector(__s2_281, __s2_281, 3, 2, 1, 0); \ 47641 __ret_281 = __noswap_vsetq_lane_p16(__noswap_vget_lane_p16(__rev2_281, __p3_281), __rev0_281, __p1_281); \ 47642 __ret_281 = __builtin_shufflevector(__ret_281, __ret_281, 7, 6, 5, 4, 3, 2, 1, 0); \ 47643 __ret_281; \ 47644 }) 47645 #endif 47646 47647 #ifdef __LITTLE_ENDIAN__ 47648 #define 
vcopyq_lane_u8(__p0_282, __p1_282, __p2_282, __p3_282) __extension__ ({ \ 47649 uint8x16_t __ret_282; \ 47650 uint8x16_t __s0_282 = __p0_282; \ 47651 uint8x8_t __s2_282 = __p2_282; \ 47652 __ret_282 = vsetq_lane_u8(vget_lane_u8(__s2_282, __p3_282), __s0_282, __p1_282); \ 47653 __ret_282; \ 47654 }) 47655 #else 47656 #define vcopyq_lane_u8(__p0_283, __p1_283, __p2_283, __p3_283) __extension__ ({ \ 47657 uint8x16_t __ret_283; \ 47658 uint8x16_t __s0_283 = __p0_283; \ 47659 uint8x8_t __s2_283 = __p2_283; \ 47660 uint8x16_t __rev0_283; __rev0_283 = __builtin_shufflevector(__s0_283, __s0_283, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 47661 uint8x8_t __rev2_283; __rev2_283 = __builtin_shufflevector(__s2_283, __s2_283, 7, 6, 5, 4, 3, 2, 1, 0); \ 47662 __ret_283 = __noswap_vsetq_lane_u8(__noswap_vget_lane_u8(__rev2_283, __p3_283), __rev0_283, __p1_283); \ 47663 __ret_283 = __builtin_shufflevector(__ret_283, __ret_283, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 47664 __ret_283; \ 47665 }) 47666 #endif 47667 47668 #ifdef __LITTLE_ENDIAN__ 47669 #define vcopyq_lane_u32(__p0_284, __p1_284, __p2_284, __p3_284) __extension__ ({ \ 47670 uint32x4_t __ret_284; \ 47671 uint32x4_t __s0_284 = __p0_284; \ 47672 uint32x2_t __s2_284 = __p2_284; \ 47673 __ret_284 = vsetq_lane_u32(vget_lane_u32(__s2_284, __p3_284), __s0_284, __p1_284); \ 47674 __ret_284; \ 47675 }) 47676 #else 47677 #define vcopyq_lane_u32(__p0_285, __p1_285, __p2_285, __p3_285) __extension__ ({ \ 47678 uint32x4_t __ret_285; \ 47679 uint32x4_t __s0_285 = __p0_285; \ 47680 uint32x2_t __s2_285 = __p2_285; \ 47681 uint32x4_t __rev0_285; __rev0_285 = __builtin_shufflevector(__s0_285, __s0_285, 3, 2, 1, 0); \ 47682 uint32x2_t __rev2_285; __rev2_285 = __builtin_shufflevector(__s2_285, __s2_285, 1, 0); \ 47683 __ret_285 = __noswap_vsetq_lane_u32(__noswap_vget_lane_u32(__rev2_285, __p3_285), __rev0_285, __p1_285); \ 47684 __ret_285 = __builtin_shufflevector(__ret_285, __ret_285, 3, 2, 1, 0); \ 47685 
__ret_285; \ 47686 }) 47687 #endif 47688 47689 #ifdef __LITTLE_ENDIAN__ 47690 #define vcopyq_lane_u64(__p0_286, __p1_286, __p2_286, __p3_286) __extension__ ({ \ 47691 uint64x2_t __ret_286; \ 47692 uint64x2_t __s0_286 = __p0_286; \ 47693 uint64x1_t __s2_286 = __p2_286; \ 47694 __ret_286 = vsetq_lane_u64(vget_lane_u64(__s2_286, __p3_286), __s0_286, __p1_286); \ 47695 __ret_286; \ 47696 }) 47697 #else 47698 #define vcopyq_lane_u64(__p0_287, __p1_287, __p2_287, __p3_287) __extension__ ({ \ 47699 uint64x2_t __ret_287; \ 47700 uint64x2_t __s0_287 = __p0_287; \ 47701 uint64x1_t __s2_287 = __p2_287; \ 47702 uint64x2_t __rev0_287; __rev0_287 = __builtin_shufflevector(__s0_287, __s0_287, 1, 0); \ 47703 __ret_287 = __noswap_vsetq_lane_u64(vget_lane_u64(__s2_287, __p3_287), __rev0_287, __p1_287); \ 47704 __ret_287 = __builtin_shufflevector(__ret_287, __ret_287, 1, 0); \ 47705 __ret_287; \ 47706 }) 47707 #endif 47708 47709 #ifdef __LITTLE_ENDIAN__ 47710 #define vcopyq_lane_u16(__p0_288, __p1_288, __p2_288, __p3_288) __extension__ ({ \ 47711 uint16x8_t __ret_288; \ 47712 uint16x8_t __s0_288 = __p0_288; \ 47713 uint16x4_t __s2_288 = __p2_288; \ 47714 __ret_288 = vsetq_lane_u16(vget_lane_u16(__s2_288, __p3_288), __s0_288, __p1_288); \ 47715 __ret_288; \ 47716 }) 47717 #else 47718 #define vcopyq_lane_u16(__p0_289, __p1_289, __p2_289, __p3_289) __extension__ ({ \ 47719 uint16x8_t __ret_289; \ 47720 uint16x8_t __s0_289 = __p0_289; \ 47721 uint16x4_t __s2_289 = __p2_289; \ 47722 uint16x8_t __rev0_289; __rev0_289 = __builtin_shufflevector(__s0_289, __s0_289, 7, 6, 5, 4, 3, 2, 1, 0); \ 47723 uint16x4_t __rev2_289; __rev2_289 = __builtin_shufflevector(__s2_289, __s2_289, 3, 2, 1, 0); \ 47724 __ret_289 = __noswap_vsetq_lane_u16(__noswap_vget_lane_u16(__rev2_289, __p3_289), __rev0_289, __p1_289); \ 47725 __ret_289 = __builtin_shufflevector(__ret_289, __ret_289, 7, 6, 5, 4, 3, 2, 1, 0); \ 47726 __ret_289; \ 47727 }) 47728 #endif 47729 47730 #ifdef __LITTLE_ENDIAN__ 47731 #define 
vcopyq_lane_s8(__p0_290, __p1_290, __p2_290, __p3_290) __extension__ ({ \ 47732 int8x16_t __ret_290; \ 47733 int8x16_t __s0_290 = __p0_290; \ 47734 int8x8_t __s2_290 = __p2_290; \ 47735 __ret_290 = vsetq_lane_s8(vget_lane_s8(__s2_290, __p3_290), __s0_290, __p1_290); \ 47736 __ret_290; \ 47737 }) 47738 #else 47739 #define vcopyq_lane_s8(__p0_291, __p1_291, __p2_291, __p3_291) __extension__ ({ \ 47740 int8x16_t __ret_291; \ 47741 int8x16_t __s0_291 = __p0_291; \ 47742 int8x8_t __s2_291 = __p2_291; \ 47743 int8x16_t __rev0_291; __rev0_291 = __builtin_shufflevector(__s0_291, __s0_291, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 47744 int8x8_t __rev2_291; __rev2_291 = __builtin_shufflevector(__s2_291, __s2_291, 7, 6, 5, 4, 3, 2, 1, 0); \ 47745 __ret_291 = __noswap_vsetq_lane_s8(__noswap_vget_lane_s8(__rev2_291, __p3_291), __rev0_291, __p1_291); \ 47746 __ret_291 = __builtin_shufflevector(__ret_291, __ret_291, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 47747 __ret_291; \ 47748 }) 47749 #endif 47750 47751 #ifdef __LITTLE_ENDIAN__ 47752 #define vcopyq_lane_f32(__p0_292, __p1_292, __p2_292, __p3_292) __extension__ ({ \ 47753 float32x4_t __ret_292; \ 47754 float32x4_t __s0_292 = __p0_292; \ 47755 float32x2_t __s2_292 = __p2_292; \ 47756 __ret_292 = vsetq_lane_f32(vget_lane_f32(__s2_292, __p3_292), __s0_292, __p1_292); \ 47757 __ret_292; \ 47758 }) 47759 #else 47760 #define vcopyq_lane_f32(__p0_293, __p1_293, __p2_293, __p3_293) __extension__ ({ \ 47761 float32x4_t __ret_293; \ 47762 float32x4_t __s0_293 = __p0_293; \ 47763 float32x2_t __s2_293 = __p2_293; \ 47764 float32x4_t __rev0_293; __rev0_293 = __builtin_shufflevector(__s0_293, __s0_293, 3, 2, 1, 0); \ 47765 float32x2_t __rev2_293; __rev2_293 = __builtin_shufflevector(__s2_293, __s2_293, 1, 0); \ 47766 __ret_293 = __noswap_vsetq_lane_f32(__noswap_vget_lane_f32(__rev2_293, __p3_293), __rev0_293, __p1_293); \ 47767 __ret_293 = __builtin_shufflevector(__ret_293, __ret_293, 3, 2, 1, 0); \ 47768 
__ret_293; \ 47769 }) 47770 #endif 47771 47772 #ifdef __LITTLE_ENDIAN__ 47773 #define vcopyq_lane_s32(__p0_294, __p1_294, __p2_294, __p3_294) __extension__ ({ \ 47774 int32x4_t __ret_294; \ 47775 int32x4_t __s0_294 = __p0_294; \ 47776 int32x2_t __s2_294 = __p2_294; \ 47777 __ret_294 = vsetq_lane_s32(vget_lane_s32(__s2_294, __p3_294), __s0_294, __p1_294); \ 47778 __ret_294; \ 47779 }) 47780 #else 47781 #define vcopyq_lane_s32(__p0_295, __p1_295, __p2_295, __p3_295) __extension__ ({ \ 47782 int32x4_t __ret_295; \ 47783 int32x4_t __s0_295 = __p0_295; \ 47784 int32x2_t __s2_295 = __p2_295; \ 47785 int32x4_t __rev0_295; __rev0_295 = __builtin_shufflevector(__s0_295, __s0_295, 3, 2, 1, 0); \ 47786 int32x2_t __rev2_295; __rev2_295 = __builtin_shufflevector(__s2_295, __s2_295, 1, 0); \ 47787 __ret_295 = __noswap_vsetq_lane_s32(__noswap_vget_lane_s32(__rev2_295, __p3_295), __rev0_295, __p1_295); \ 47788 __ret_295 = __builtin_shufflevector(__ret_295, __ret_295, 3, 2, 1, 0); \ 47789 __ret_295; \ 47790 }) 47791 #endif 47792 47793 #ifdef __LITTLE_ENDIAN__ 47794 #define vcopyq_lane_s64(__p0_296, __p1_296, __p2_296, __p3_296) __extension__ ({ \ 47795 int64x2_t __ret_296; \ 47796 int64x2_t __s0_296 = __p0_296; \ 47797 int64x1_t __s2_296 = __p2_296; \ 47798 __ret_296 = vsetq_lane_s64(vget_lane_s64(__s2_296, __p3_296), __s0_296, __p1_296); \ 47799 __ret_296; \ 47800 }) 47801 #else 47802 #define vcopyq_lane_s64(__p0_297, __p1_297, __p2_297, __p3_297) __extension__ ({ \ 47803 int64x2_t __ret_297; \ 47804 int64x2_t __s0_297 = __p0_297; \ 47805 int64x1_t __s2_297 = __p2_297; \ 47806 int64x2_t __rev0_297; __rev0_297 = __builtin_shufflevector(__s0_297, __s0_297, 1, 0); \ 47807 __ret_297 = __noswap_vsetq_lane_s64(vget_lane_s64(__s2_297, __p3_297), __rev0_297, __p1_297); \ 47808 __ret_297 = __builtin_shufflevector(__ret_297, __ret_297, 1, 0); \ 47809 __ret_297; \ 47810 }) 47811 #endif 47812 47813 #ifdef __LITTLE_ENDIAN__ 47814 #define vcopyq_lane_s16(__p0_298, __p1_298, __p2_298, __p3_298) 
__extension__ ({ \ 47815 int16x8_t __ret_298; \ 47816 int16x8_t __s0_298 = __p0_298; \ 47817 int16x4_t __s2_298 = __p2_298; \ 47818 __ret_298 = vsetq_lane_s16(vget_lane_s16(__s2_298, __p3_298), __s0_298, __p1_298); \ 47819 __ret_298; \ 47820 }) 47821 #else 47822 #define vcopyq_lane_s16(__p0_299, __p1_299, __p2_299, __p3_299) __extension__ ({ \ 47823 int16x8_t __ret_299; \ 47824 int16x8_t __s0_299 = __p0_299; \ 47825 int16x4_t __s2_299 = __p2_299; \ 47826 int16x8_t __rev0_299; __rev0_299 = __builtin_shufflevector(__s0_299, __s0_299, 7, 6, 5, 4, 3, 2, 1, 0); \ 47827 int16x4_t __rev2_299; __rev2_299 = __builtin_shufflevector(__s2_299, __s2_299, 3, 2, 1, 0); \ 47828 __ret_299 = __noswap_vsetq_lane_s16(__noswap_vget_lane_s16(__rev2_299, __p3_299), __rev0_299, __p1_299); \ 47829 __ret_299 = __builtin_shufflevector(__ret_299, __ret_299, 7, 6, 5, 4, 3, 2, 1, 0); \ 47830 __ret_299; \ 47831 }) 47832 #endif 47833 47834 #ifdef __LITTLE_ENDIAN__ 47835 #define vcopy_lane_p8(__p0_300, __p1_300, __p2_300, __p3_300) __extension__ ({ \ 47836 poly8x8_t __ret_300; \ 47837 poly8x8_t __s0_300 = __p0_300; \ 47838 poly8x8_t __s2_300 = __p2_300; \ 47839 __ret_300 = vset_lane_p8(vget_lane_p8(__s2_300, __p3_300), __s0_300, __p1_300); \ 47840 __ret_300; \ 47841 }) 47842 #else 47843 #define vcopy_lane_p8(__p0_301, __p1_301, __p2_301, __p3_301) __extension__ ({ \ 47844 poly8x8_t __ret_301; \ 47845 poly8x8_t __s0_301 = __p0_301; \ 47846 poly8x8_t __s2_301 = __p2_301; \ 47847 poly8x8_t __rev0_301; __rev0_301 = __builtin_shufflevector(__s0_301, __s0_301, 7, 6, 5, 4, 3, 2, 1, 0); \ 47848 poly8x8_t __rev2_301; __rev2_301 = __builtin_shufflevector(__s2_301, __s2_301, 7, 6, 5, 4, 3, 2, 1, 0); \ 47849 __ret_301 = __noswap_vset_lane_p8(__noswap_vget_lane_p8(__rev2_301, __p3_301), __rev0_301, __p1_301); \ 47850 __ret_301 = __builtin_shufflevector(__ret_301, __ret_301, 7, 6, 5, 4, 3, 2, 1, 0); \ 47851 __ret_301; \ 47852 }) 47853 #endif 47854 47855 #ifdef __LITTLE_ENDIAN__ 47856 #define 
vcopy_lane_p16(__p0_302, __p1_302, __p2_302, __p3_302) __extension__ ({ \ 47857 poly16x4_t __ret_302; \ 47858 poly16x4_t __s0_302 = __p0_302; \ 47859 poly16x4_t __s2_302 = __p2_302; \ 47860 __ret_302 = vset_lane_p16(vget_lane_p16(__s2_302, __p3_302), __s0_302, __p1_302); \ 47861 __ret_302; \ 47862 }) 47863 #else 47864 #define vcopy_lane_p16(__p0_303, __p1_303, __p2_303, __p3_303) __extension__ ({ \ 47865 poly16x4_t __ret_303; \ 47866 poly16x4_t __s0_303 = __p0_303; \ 47867 poly16x4_t __s2_303 = __p2_303; \ 47868 poly16x4_t __rev0_303; __rev0_303 = __builtin_shufflevector(__s0_303, __s0_303, 3, 2, 1, 0); \ 47869 poly16x4_t __rev2_303; __rev2_303 = __builtin_shufflevector(__s2_303, __s2_303, 3, 2, 1, 0); \ 47870 __ret_303 = __noswap_vset_lane_p16(__noswap_vget_lane_p16(__rev2_303, __p3_303), __rev0_303, __p1_303); \ 47871 __ret_303 = __builtin_shufflevector(__ret_303, __ret_303, 3, 2, 1, 0); \ 47872 __ret_303; \ 47873 }) 47874 #endif 47875 47876 #ifdef __LITTLE_ENDIAN__ 47877 #define vcopy_lane_u8(__p0_304, __p1_304, __p2_304, __p3_304) __extension__ ({ \ 47878 uint8x8_t __ret_304; \ 47879 uint8x8_t __s0_304 = __p0_304; \ 47880 uint8x8_t __s2_304 = __p2_304; \ 47881 __ret_304 = vset_lane_u8(vget_lane_u8(__s2_304, __p3_304), __s0_304, __p1_304); \ 47882 __ret_304; \ 47883 }) 47884 #else 47885 #define vcopy_lane_u8(__p0_305, __p1_305, __p2_305, __p3_305) __extension__ ({ \ 47886 uint8x8_t __ret_305; \ 47887 uint8x8_t __s0_305 = __p0_305; \ 47888 uint8x8_t __s2_305 = __p2_305; \ 47889 uint8x8_t __rev0_305; __rev0_305 = __builtin_shufflevector(__s0_305, __s0_305, 7, 6, 5, 4, 3, 2, 1, 0); \ 47890 uint8x8_t __rev2_305; __rev2_305 = __builtin_shufflevector(__s2_305, __s2_305, 7, 6, 5, 4, 3, 2, 1, 0); \ 47891 __ret_305 = __noswap_vset_lane_u8(__noswap_vget_lane_u8(__rev2_305, __p3_305), __rev0_305, __p1_305); \ 47892 __ret_305 = __builtin_shufflevector(__ret_305, __ret_305, 7, 6, 5, 4, 3, 2, 1, 0); \ 47893 __ret_305; \ 47894 }) 47895 #endif 47896 47897 #ifdef 
__LITTLE_ENDIAN__ 47898 #define vcopy_lane_u32(__p0_306, __p1_306, __p2_306, __p3_306) __extension__ ({ \ 47899 uint32x2_t __ret_306; \ 47900 uint32x2_t __s0_306 = __p0_306; \ 47901 uint32x2_t __s2_306 = __p2_306; \ 47902 __ret_306 = vset_lane_u32(vget_lane_u32(__s2_306, __p3_306), __s0_306, __p1_306); \ 47903 __ret_306; \ 47904 }) 47905 #else 47906 #define vcopy_lane_u32(__p0_307, __p1_307, __p2_307, __p3_307) __extension__ ({ \ 47907 uint32x2_t __ret_307; \ 47908 uint32x2_t __s0_307 = __p0_307; \ 47909 uint32x2_t __s2_307 = __p2_307; \ 47910 uint32x2_t __rev0_307; __rev0_307 = __builtin_shufflevector(__s0_307, __s0_307, 1, 0); \ 47911 uint32x2_t __rev2_307; __rev2_307 = __builtin_shufflevector(__s2_307, __s2_307, 1, 0); \ 47912 __ret_307 = __noswap_vset_lane_u32(__noswap_vget_lane_u32(__rev2_307, __p3_307), __rev0_307, __p1_307); \ 47913 __ret_307 = __builtin_shufflevector(__ret_307, __ret_307, 1, 0); \ 47914 __ret_307; \ 47915 }) 47916 #endif 47917 47918 #define vcopy_lane_u64(__p0_308, __p1_308, __p2_308, __p3_308) __extension__ ({ \ 47919 uint64x1_t __ret_308; \ 47920 uint64x1_t __s0_308 = __p0_308; \ 47921 uint64x1_t __s2_308 = __p2_308; \ 47922 __ret_308 = vset_lane_u64(vget_lane_u64(__s2_308, __p3_308), __s0_308, __p1_308); \ 47923 __ret_308; \ 47924 }) 47925 #ifdef __LITTLE_ENDIAN__ 47926 #define vcopy_lane_u16(__p0_309, __p1_309, __p2_309, __p3_309) __extension__ ({ \ 47927 uint16x4_t __ret_309; \ 47928 uint16x4_t __s0_309 = __p0_309; \ 47929 uint16x4_t __s2_309 = __p2_309; \ 47930 __ret_309 = vset_lane_u16(vget_lane_u16(__s2_309, __p3_309), __s0_309, __p1_309); \ 47931 __ret_309; \ 47932 }) 47933 #else 47934 #define vcopy_lane_u16(__p0_310, __p1_310, __p2_310, __p3_310) __extension__ ({ \ 47935 uint16x4_t __ret_310; \ 47936 uint16x4_t __s0_310 = __p0_310; \ 47937 uint16x4_t __s2_310 = __p2_310; \ 47938 uint16x4_t __rev0_310; __rev0_310 = __builtin_shufflevector(__s0_310, __s0_310, 3, 2, 1, 0); \ 47939 uint16x4_t __rev2_310; __rev2_310 = 
__builtin_shufflevector(__s2_310, __s2_310, 3, 2, 1, 0); \ 47940 __ret_310 = __noswap_vset_lane_u16(__noswap_vget_lane_u16(__rev2_310, __p3_310), __rev0_310, __p1_310); \ 47941 __ret_310 = __builtin_shufflevector(__ret_310, __ret_310, 3, 2, 1, 0); \ 47942 __ret_310; \ 47943 }) 47944 #endif 47945 47946 #ifdef __LITTLE_ENDIAN__ 47947 #define vcopy_lane_s8(__p0_311, __p1_311, __p2_311, __p3_311) __extension__ ({ \ 47948 int8x8_t __ret_311; \ 47949 int8x8_t __s0_311 = __p0_311; \ 47950 int8x8_t __s2_311 = __p2_311; \ 47951 __ret_311 = vset_lane_s8(vget_lane_s8(__s2_311, __p3_311), __s0_311, __p1_311); \ 47952 __ret_311; \ 47953 }) 47954 #else 47955 #define vcopy_lane_s8(__p0_312, __p1_312, __p2_312, __p3_312) __extension__ ({ \ 47956 int8x8_t __ret_312; \ 47957 int8x8_t __s0_312 = __p0_312; \ 47958 int8x8_t __s2_312 = __p2_312; \ 47959 int8x8_t __rev0_312; __rev0_312 = __builtin_shufflevector(__s0_312, __s0_312, 7, 6, 5, 4, 3, 2, 1, 0); \ 47960 int8x8_t __rev2_312; __rev2_312 = __builtin_shufflevector(__s2_312, __s2_312, 7, 6, 5, 4, 3, 2, 1, 0); \ 47961 __ret_312 = __noswap_vset_lane_s8(__noswap_vget_lane_s8(__rev2_312, __p3_312), __rev0_312, __p1_312); \ 47962 __ret_312 = __builtin_shufflevector(__ret_312, __ret_312, 7, 6, 5, 4, 3, 2, 1, 0); \ 47963 __ret_312; \ 47964 }) 47965 #endif 47966 47967 #ifdef __LITTLE_ENDIAN__ 47968 #define vcopy_lane_f32(__p0_313, __p1_313, __p2_313, __p3_313) __extension__ ({ \ 47969 float32x2_t __ret_313; \ 47970 float32x2_t __s0_313 = __p0_313; \ 47971 float32x2_t __s2_313 = __p2_313; \ 47972 __ret_313 = vset_lane_f32(vget_lane_f32(__s2_313, __p3_313), __s0_313, __p1_313); \ 47973 __ret_313; \ 47974 }) 47975 #else 47976 #define vcopy_lane_f32(__p0_314, __p1_314, __p2_314, __p3_314) __extension__ ({ \ 47977 float32x2_t __ret_314; \ 47978 float32x2_t __s0_314 = __p0_314; \ 47979 float32x2_t __s2_314 = __p2_314; \ 47980 float32x2_t __rev0_314; __rev0_314 = __builtin_shufflevector(__s0_314, __s0_314, 1, 0); \ 47981 float32x2_t __rev2_314; 
__rev2_314 = __builtin_shufflevector(__s2_314, __s2_314, 1, 0); \ 47982 __ret_314 = __noswap_vset_lane_f32(__noswap_vget_lane_f32(__rev2_314, __p3_314), __rev0_314, __p1_314); \ 47983 __ret_314 = __builtin_shufflevector(__ret_314, __ret_314, 1, 0); \ 47984 __ret_314; \ 47985 }) 47986 #endif 47987 47988 #ifdef __LITTLE_ENDIAN__ 47989 #define vcopy_lane_s32(__p0_315, __p1_315, __p2_315, __p3_315) __extension__ ({ \ 47990 int32x2_t __ret_315; \ 47991 int32x2_t __s0_315 = __p0_315; \ 47992 int32x2_t __s2_315 = __p2_315; \ 47993 __ret_315 = vset_lane_s32(vget_lane_s32(__s2_315, __p3_315), __s0_315, __p1_315); \ 47994 __ret_315; \ 47995 }) 47996 #else 47997 #define vcopy_lane_s32(__p0_316, __p1_316, __p2_316, __p3_316) __extension__ ({ \ 47998 int32x2_t __ret_316; \ 47999 int32x2_t __s0_316 = __p0_316; \ 48000 int32x2_t __s2_316 = __p2_316; \ 48001 int32x2_t __rev0_316; __rev0_316 = __builtin_shufflevector(__s0_316, __s0_316, 1, 0); \ 48002 int32x2_t __rev2_316; __rev2_316 = __builtin_shufflevector(__s2_316, __s2_316, 1, 0); \ 48003 __ret_316 = __noswap_vset_lane_s32(__noswap_vget_lane_s32(__rev2_316, __p3_316), __rev0_316, __p1_316); \ 48004 __ret_316 = __builtin_shufflevector(__ret_316, __ret_316, 1, 0); \ 48005 __ret_316; \ 48006 }) 48007 #endif 48008 48009 #define vcopy_lane_s64(__p0_317, __p1_317, __p2_317, __p3_317) __extension__ ({ \ 48010 int64x1_t __ret_317; \ 48011 int64x1_t __s0_317 = __p0_317; \ 48012 int64x1_t __s2_317 = __p2_317; \ 48013 __ret_317 = vset_lane_s64(vget_lane_s64(__s2_317, __p3_317), __s0_317, __p1_317); \ 48014 __ret_317; \ 48015 }) 48016 #ifdef __LITTLE_ENDIAN__ 48017 #define vcopy_lane_s16(__p0_318, __p1_318, __p2_318, __p3_318) __extension__ ({ \ 48018 int16x4_t __ret_318; \ 48019 int16x4_t __s0_318 = __p0_318; \ 48020 int16x4_t __s2_318 = __p2_318; \ 48021 __ret_318 = vset_lane_s16(vget_lane_s16(__s2_318, __p3_318), __s0_318, __p1_318); \ 48022 __ret_318; \ 48023 }) 48024 #else 48025 #define vcopy_lane_s16(__p0_319, __p1_319, __p2_319, 
__p3_319) __extension__ ({ \ 48026 int16x4_t __ret_319; \ 48027 int16x4_t __s0_319 = __p0_319; \ 48028 int16x4_t __s2_319 = __p2_319; \ 48029 int16x4_t __rev0_319; __rev0_319 = __builtin_shufflevector(__s0_319, __s0_319, 3, 2, 1, 0); \ 48030 int16x4_t __rev2_319; __rev2_319 = __builtin_shufflevector(__s2_319, __s2_319, 3, 2, 1, 0); \ 48031 __ret_319 = __noswap_vset_lane_s16(__noswap_vget_lane_s16(__rev2_319, __p3_319), __rev0_319, __p1_319); \ 48032 __ret_319 = __builtin_shufflevector(__ret_319, __ret_319, 3, 2, 1, 0); \ 48033 __ret_319; \ 48034 }) 48035 #endif 48036 48037 #ifdef __LITTLE_ENDIAN__ 48038 #define vcopyq_laneq_p8(__p0_320, __p1_320, __p2_320, __p3_320) __extension__ ({ \ 48039 poly8x16_t __ret_320; \ 48040 poly8x16_t __s0_320 = __p0_320; \ 48041 poly8x16_t __s2_320 = __p2_320; \ 48042 __ret_320 = vsetq_lane_p8(vgetq_lane_p8(__s2_320, __p3_320), __s0_320, __p1_320); \ 48043 __ret_320; \ 48044 }) 48045 #else 48046 #define vcopyq_laneq_p8(__p0_321, __p1_321, __p2_321, __p3_321) __extension__ ({ \ 48047 poly8x16_t __ret_321; \ 48048 poly8x16_t __s0_321 = __p0_321; \ 48049 poly8x16_t __s2_321 = __p2_321; \ 48050 poly8x16_t __rev0_321; __rev0_321 = __builtin_shufflevector(__s0_321, __s0_321, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48051 poly8x16_t __rev2_321; __rev2_321 = __builtin_shufflevector(__s2_321, __s2_321, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48052 __ret_321 = __noswap_vsetq_lane_p8(__noswap_vgetq_lane_p8(__rev2_321, __p3_321), __rev0_321, __p1_321); \ 48053 __ret_321 = __builtin_shufflevector(__ret_321, __ret_321, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48054 __ret_321; \ 48055 }) 48056 #endif 48057 48058 #ifdef __LITTLE_ENDIAN__ 48059 #define vcopyq_laneq_p16(__p0_322, __p1_322, __p2_322, __p3_322) __extension__ ({ \ 48060 poly16x8_t __ret_322; \ 48061 poly16x8_t __s0_322 = __p0_322; \ 48062 poly16x8_t __s2_322 = __p2_322; \ 48063 __ret_322 = vsetq_lane_p16(vgetq_lane_p16(__s2_322, __p3_322), 
__s0_322, __p1_322); \ 48064 __ret_322; \ 48065 }) 48066 #else 48067 #define vcopyq_laneq_p16(__p0_323, __p1_323, __p2_323, __p3_323) __extension__ ({ \ 48068 poly16x8_t __ret_323; \ 48069 poly16x8_t __s0_323 = __p0_323; \ 48070 poly16x8_t __s2_323 = __p2_323; \ 48071 poly16x8_t __rev0_323; __rev0_323 = __builtin_shufflevector(__s0_323, __s0_323, 7, 6, 5, 4, 3, 2, 1, 0); \ 48072 poly16x8_t __rev2_323; __rev2_323 = __builtin_shufflevector(__s2_323, __s2_323, 7, 6, 5, 4, 3, 2, 1, 0); \ 48073 __ret_323 = __noswap_vsetq_lane_p16(__noswap_vgetq_lane_p16(__rev2_323, __p3_323), __rev0_323, __p1_323); \ 48074 __ret_323 = __builtin_shufflevector(__ret_323, __ret_323, 7, 6, 5, 4, 3, 2, 1, 0); \ 48075 __ret_323; \ 48076 }) 48077 #endif 48078 48079 #ifdef __LITTLE_ENDIAN__ 48080 #define vcopyq_laneq_u8(__p0_324, __p1_324, __p2_324, __p3_324) __extension__ ({ \ 48081 uint8x16_t __ret_324; \ 48082 uint8x16_t __s0_324 = __p0_324; \ 48083 uint8x16_t __s2_324 = __p2_324; \ 48084 __ret_324 = vsetq_lane_u8(vgetq_lane_u8(__s2_324, __p3_324), __s0_324, __p1_324); \ 48085 __ret_324; \ 48086 }) 48087 #else 48088 #define vcopyq_laneq_u8(__p0_325, __p1_325, __p2_325, __p3_325) __extension__ ({ \ 48089 uint8x16_t __ret_325; \ 48090 uint8x16_t __s0_325 = __p0_325; \ 48091 uint8x16_t __s2_325 = __p2_325; \ 48092 uint8x16_t __rev0_325; __rev0_325 = __builtin_shufflevector(__s0_325, __s0_325, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48093 uint8x16_t __rev2_325; __rev2_325 = __builtin_shufflevector(__s2_325, __s2_325, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48094 __ret_325 = __noswap_vsetq_lane_u8(__noswap_vgetq_lane_u8(__rev2_325, __p3_325), __rev0_325, __p1_325); \ 48095 __ret_325 = __builtin_shufflevector(__ret_325, __ret_325, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48096 __ret_325; \ 48097 }) 48098 #endif 48099 48100 #ifdef __LITTLE_ENDIAN__ 48101 #define vcopyq_laneq_u32(__p0_326, __p1_326, __p2_326, __p3_326) __extension__ ({ \ 48102 
uint32x4_t __ret_326; \ 48103 uint32x4_t __s0_326 = __p0_326; \ 48104 uint32x4_t __s2_326 = __p2_326; \ 48105 __ret_326 = vsetq_lane_u32(vgetq_lane_u32(__s2_326, __p3_326), __s0_326, __p1_326); \ 48106 __ret_326; \ 48107 }) 48108 #else 48109 #define vcopyq_laneq_u32(__p0_327, __p1_327, __p2_327, __p3_327) __extension__ ({ \ 48110 uint32x4_t __ret_327; \ 48111 uint32x4_t __s0_327 = __p0_327; \ 48112 uint32x4_t __s2_327 = __p2_327; \ 48113 uint32x4_t __rev0_327; __rev0_327 = __builtin_shufflevector(__s0_327, __s0_327, 3, 2, 1, 0); \ 48114 uint32x4_t __rev2_327; __rev2_327 = __builtin_shufflevector(__s2_327, __s2_327, 3, 2, 1, 0); \ 48115 __ret_327 = __noswap_vsetq_lane_u32(__noswap_vgetq_lane_u32(__rev2_327, __p3_327), __rev0_327, __p1_327); \ 48116 __ret_327 = __builtin_shufflevector(__ret_327, __ret_327, 3, 2, 1, 0); \ 48117 __ret_327; \ 48118 }) 48119 #endif 48120 48121 #ifdef __LITTLE_ENDIAN__ 48122 #define vcopyq_laneq_u64(__p0_328, __p1_328, __p2_328, __p3_328) __extension__ ({ \ 48123 uint64x2_t __ret_328; \ 48124 uint64x2_t __s0_328 = __p0_328; \ 48125 uint64x2_t __s2_328 = __p2_328; \ 48126 __ret_328 = vsetq_lane_u64(vgetq_lane_u64(__s2_328, __p3_328), __s0_328, __p1_328); \ 48127 __ret_328; \ 48128 }) 48129 #else 48130 #define vcopyq_laneq_u64(__p0_329, __p1_329, __p2_329, __p3_329) __extension__ ({ \ 48131 uint64x2_t __ret_329; \ 48132 uint64x2_t __s0_329 = __p0_329; \ 48133 uint64x2_t __s2_329 = __p2_329; \ 48134 uint64x2_t __rev0_329; __rev0_329 = __builtin_shufflevector(__s0_329, __s0_329, 1, 0); \ 48135 uint64x2_t __rev2_329; __rev2_329 = __builtin_shufflevector(__s2_329, __s2_329, 1, 0); \ 48136 __ret_329 = __noswap_vsetq_lane_u64(__noswap_vgetq_lane_u64(__rev2_329, __p3_329), __rev0_329, __p1_329); \ 48137 __ret_329 = __builtin_shufflevector(__ret_329, __ret_329, 1, 0); \ 48138 __ret_329; \ 48139 }) 48140 #endif 48141 48142 #ifdef __LITTLE_ENDIAN__ 48143 #define vcopyq_laneq_u16(__p0_330, __p1_330, __p2_330, __p3_330) __extension__ ({ \ 48144 
uint16x8_t __ret_330; \ 48145 uint16x8_t __s0_330 = __p0_330; \ 48146 uint16x8_t __s2_330 = __p2_330; \ 48147 __ret_330 = vsetq_lane_u16(vgetq_lane_u16(__s2_330, __p3_330), __s0_330, __p1_330); \ 48148 __ret_330; \ 48149 }) 48150 #else 48151 #define vcopyq_laneq_u16(__p0_331, __p1_331, __p2_331, __p3_331) __extension__ ({ \ 48152 uint16x8_t __ret_331; \ 48153 uint16x8_t __s0_331 = __p0_331; \ 48154 uint16x8_t __s2_331 = __p2_331; \ 48155 uint16x8_t __rev0_331; __rev0_331 = __builtin_shufflevector(__s0_331, __s0_331, 7, 6, 5, 4, 3, 2, 1, 0); \ 48156 uint16x8_t __rev2_331; __rev2_331 = __builtin_shufflevector(__s2_331, __s2_331, 7, 6, 5, 4, 3, 2, 1, 0); \ 48157 __ret_331 = __noswap_vsetq_lane_u16(__noswap_vgetq_lane_u16(__rev2_331, __p3_331), __rev0_331, __p1_331); \ 48158 __ret_331 = __builtin_shufflevector(__ret_331, __ret_331, 7, 6, 5, 4, 3, 2, 1, 0); \ 48159 __ret_331; \ 48160 }) 48161 #endif 48162 48163 #ifdef __LITTLE_ENDIAN__ 48164 #define vcopyq_laneq_s8(__p0_332, __p1_332, __p2_332, __p3_332) __extension__ ({ \ 48165 int8x16_t __ret_332; \ 48166 int8x16_t __s0_332 = __p0_332; \ 48167 int8x16_t __s2_332 = __p2_332; \ 48168 __ret_332 = vsetq_lane_s8(vgetq_lane_s8(__s2_332, __p3_332), __s0_332, __p1_332); \ 48169 __ret_332; \ 48170 }) 48171 #else 48172 #define vcopyq_laneq_s8(__p0_333, __p1_333, __p2_333, __p3_333) __extension__ ({ \ 48173 int8x16_t __ret_333; \ 48174 int8x16_t __s0_333 = __p0_333; \ 48175 int8x16_t __s2_333 = __p2_333; \ 48176 int8x16_t __rev0_333; __rev0_333 = __builtin_shufflevector(__s0_333, __s0_333, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48177 int8x16_t __rev2_333; __rev2_333 = __builtin_shufflevector(__s2_333, __s2_333, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48178 __ret_333 = __noswap_vsetq_lane_s8(__noswap_vgetq_lane_s8(__rev2_333, __p3_333), __rev0_333, __p1_333); \ 48179 __ret_333 = __builtin_shufflevector(__ret_333, __ret_333, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48180 
__ret_333; \ 48181 }) 48182 #endif 48183 48184 #ifdef __LITTLE_ENDIAN__ 48185 #define vcopyq_laneq_f32(__p0_334, __p1_334, __p2_334, __p3_334) __extension__ ({ \ 48186 float32x4_t __ret_334; \ 48187 float32x4_t __s0_334 = __p0_334; \ 48188 float32x4_t __s2_334 = __p2_334; \ 48189 __ret_334 = vsetq_lane_f32(vgetq_lane_f32(__s2_334, __p3_334), __s0_334, __p1_334); \ 48190 __ret_334; \ 48191 }) 48192 #else 48193 #define vcopyq_laneq_f32(__p0_335, __p1_335, __p2_335, __p3_335) __extension__ ({ \ 48194 float32x4_t __ret_335; \ 48195 float32x4_t __s0_335 = __p0_335; \ 48196 float32x4_t __s2_335 = __p2_335; \ 48197 float32x4_t __rev0_335; __rev0_335 = __builtin_shufflevector(__s0_335, __s0_335, 3, 2, 1, 0); \ 48198 float32x4_t __rev2_335; __rev2_335 = __builtin_shufflevector(__s2_335, __s2_335, 3, 2, 1, 0); \ 48199 __ret_335 = __noswap_vsetq_lane_f32(__noswap_vgetq_lane_f32(__rev2_335, __p3_335), __rev0_335, __p1_335); \ 48200 __ret_335 = __builtin_shufflevector(__ret_335, __ret_335, 3, 2, 1, 0); \ 48201 __ret_335; \ 48202 }) 48203 #endif 48204 48205 #ifdef __LITTLE_ENDIAN__ 48206 #define vcopyq_laneq_s32(__p0_336, __p1_336, __p2_336, __p3_336) __extension__ ({ \ 48207 int32x4_t __ret_336; \ 48208 int32x4_t __s0_336 = __p0_336; \ 48209 int32x4_t __s2_336 = __p2_336; \ 48210 __ret_336 = vsetq_lane_s32(vgetq_lane_s32(__s2_336, __p3_336), __s0_336, __p1_336); \ 48211 __ret_336; \ 48212 }) 48213 #else 48214 #define vcopyq_laneq_s32(__p0_337, __p1_337, __p2_337, __p3_337) __extension__ ({ \ 48215 int32x4_t __ret_337; \ 48216 int32x4_t __s0_337 = __p0_337; \ 48217 int32x4_t __s2_337 = __p2_337; \ 48218 int32x4_t __rev0_337; __rev0_337 = __builtin_shufflevector(__s0_337, __s0_337, 3, 2, 1, 0); \ 48219 int32x4_t __rev2_337; __rev2_337 = __builtin_shufflevector(__s2_337, __s2_337, 3, 2, 1, 0); \ 48220 __ret_337 = __noswap_vsetq_lane_s32(__noswap_vgetq_lane_s32(__rev2_337, __p3_337), __rev0_337, __p1_337); \ 48221 __ret_337 = __builtin_shufflevector(__ret_337, __ret_337, 3, 2, 1, 
0); \ 48222 __ret_337; \ 48223 }) 48224 #endif 48225 48226 #ifdef __LITTLE_ENDIAN__ 48227 #define vcopyq_laneq_s64(__p0_338, __p1_338, __p2_338, __p3_338) __extension__ ({ \ 48228 int64x2_t __ret_338; \ 48229 int64x2_t __s0_338 = __p0_338; \ 48230 int64x2_t __s2_338 = __p2_338; \ 48231 __ret_338 = vsetq_lane_s64(vgetq_lane_s64(__s2_338, __p3_338), __s0_338, __p1_338); \ 48232 __ret_338; \ 48233 }) 48234 #else 48235 #define vcopyq_laneq_s64(__p0_339, __p1_339, __p2_339, __p3_339) __extension__ ({ \ 48236 int64x2_t __ret_339; \ 48237 int64x2_t __s0_339 = __p0_339; \ 48238 int64x2_t __s2_339 = __p2_339; \ 48239 int64x2_t __rev0_339; __rev0_339 = __builtin_shufflevector(__s0_339, __s0_339, 1, 0); \ 48240 int64x2_t __rev2_339; __rev2_339 = __builtin_shufflevector(__s2_339, __s2_339, 1, 0); \ 48241 __ret_339 = __noswap_vsetq_lane_s64(__noswap_vgetq_lane_s64(__rev2_339, __p3_339), __rev0_339, __p1_339); \ 48242 __ret_339 = __builtin_shufflevector(__ret_339, __ret_339, 1, 0); \ 48243 __ret_339; \ 48244 }) 48245 #endif 48246 48247 #ifdef __LITTLE_ENDIAN__ 48248 #define vcopyq_laneq_s16(__p0_340, __p1_340, __p2_340, __p3_340) __extension__ ({ \ 48249 int16x8_t __ret_340; \ 48250 int16x8_t __s0_340 = __p0_340; \ 48251 int16x8_t __s2_340 = __p2_340; \ 48252 __ret_340 = vsetq_lane_s16(vgetq_lane_s16(__s2_340, __p3_340), __s0_340, __p1_340); \ 48253 __ret_340; \ 48254 }) 48255 #else 48256 #define vcopyq_laneq_s16(__p0_341, __p1_341, __p2_341, __p3_341) __extension__ ({ \ 48257 int16x8_t __ret_341; \ 48258 int16x8_t __s0_341 = __p0_341; \ 48259 int16x8_t __s2_341 = __p2_341; \ 48260 int16x8_t __rev0_341; __rev0_341 = __builtin_shufflevector(__s0_341, __s0_341, 7, 6, 5, 4, 3, 2, 1, 0); \ 48261 int16x8_t __rev2_341; __rev2_341 = __builtin_shufflevector(__s2_341, __s2_341, 7, 6, 5, 4, 3, 2, 1, 0); \ 48262 __ret_341 = __noswap_vsetq_lane_s16(__noswap_vgetq_lane_s16(__rev2_341, __p3_341), __rev0_341, __p1_341); \ 48263 __ret_341 = __builtin_shufflevector(__ret_341, __ret_341, 7, 6, 5, 
4, 3, 2, 1, 0); \ 48264 __ret_341; \ 48265 }) 48266 #endif 48267 48268 #ifdef __LITTLE_ENDIAN__ 48269 #define vcopy_laneq_p8(__p0_342, __p1_342, __p2_342, __p3_342) __extension__ ({ \ 48270 poly8x8_t __ret_342; \ 48271 poly8x8_t __s0_342 = __p0_342; \ 48272 poly8x16_t __s2_342 = __p2_342; \ 48273 __ret_342 = vset_lane_p8(vgetq_lane_p8(__s2_342, __p3_342), __s0_342, __p1_342); \ 48274 __ret_342; \ 48275 }) 48276 #else 48277 #define vcopy_laneq_p8(__p0_343, __p1_343, __p2_343, __p3_343) __extension__ ({ \ 48278 poly8x8_t __ret_343; \ 48279 poly8x8_t __s0_343 = __p0_343; \ 48280 poly8x16_t __s2_343 = __p2_343; \ 48281 poly8x8_t __rev0_343; __rev0_343 = __builtin_shufflevector(__s0_343, __s0_343, 7, 6, 5, 4, 3, 2, 1, 0); \ 48282 poly8x16_t __rev2_343; __rev2_343 = __builtin_shufflevector(__s2_343, __s2_343, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48283 __ret_343 = __noswap_vset_lane_p8(__noswap_vgetq_lane_p8(__rev2_343, __p3_343), __rev0_343, __p1_343); \ 48284 __ret_343 = __builtin_shufflevector(__ret_343, __ret_343, 7, 6, 5, 4, 3, 2, 1, 0); \ 48285 __ret_343; \ 48286 }) 48287 #endif 48288 48289 #ifdef __LITTLE_ENDIAN__ 48290 #define vcopy_laneq_p16(__p0_344, __p1_344, __p2_344, __p3_344) __extension__ ({ \ 48291 poly16x4_t __ret_344; \ 48292 poly16x4_t __s0_344 = __p0_344; \ 48293 poly16x8_t __s2_344 = __p2_344; \ 48294 __ret_344 = vset_lane_p16(vgetq_lane_p16(__s2_344, __p3_344), __s0_344, __p1_344); \ 48295 __ret_344; \ 48296 }) 48297 #else 48298 #define vcopy_laneq_p16(__p0_345, __p1_345, __p2_345, __p3_345) __extension__ ({ \ 48299 poly16x4_t __ret_345; \ 48300 poly16x4_t __s0_345 = __p0_345; \ 48301 poly16x8_t __s2_345 = __p2_345; \ 48302 poly16x4_t __rev0_345; __rev0_345 = __builtin_shufflevector(__s0_345, __s0_345, 3, 2, 1, 0); \ 48303 poly16x8_t __rev2_345; __rev2_345 = __builtin_shufflevector(__s2_345, __s2_345, 7, 6, 5, 4, 3, 2, 1, 0); \ 48304 __ret_345 = __noswap_vset_lane_p16(__noswap_vgetq_lane_p16(__rev2_345, __p3_345), __rev0_345, 
__p1_345); \ 48305 __ret_345 = __builtin_shufflevector(__ret_345, __ret_345, 3, 2, 1, 0); \ 48306 __ret_345; \ 48307 }) 48308 #endif 48309 48310 #ifdef __LITTLE_ENDIAN__ 48311 #define vcopy_laneq_u8(__p0_346, __p1_346, __p2_346, __p3_346) __extension__ ({ \ 48312 uint8x8_t __ret_346; \ 48313 uint8x8_t __s0_346 = __p0_346; \ 48314 uint8x16_t __s2_346 = __p2_346; \ 48315 __ret_346 = vset_lane_u8(vgetq_lane_u8(__s2_346, __p3_346), __s0_346, __p1_346); \ 48316 __ret_346; \ 48317 }) 48318 #else 48319 #define vcopy_laneq_u8(__p0_347, __p1_347, __p2_347, __p3_347) __extension__ ({ \ 48320 uint8x8_t __ret_347; \ 48321 uint8x8_t __s0_347 = __p0_347; \ 48322 uint8x16_t __s2_347 = __p2_347; \ 48323 uint8x8_t __rev0_347; __rev0_347 = __builtin_shufflevector(__s0_347, __s0_347, 7, 6, 5, 4, 3, 2, 1, 0); \ 48324 uint8x16_t __rev2_347; __rev2_347 = __builtin_shufflevector(__s2_347, __s2_347, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48325 __ret_347 = __noswap_vset_lane_u8(__noswap_vgetq_lane_u8(__rev2_347, __p3_347), __rev0_347, __p1_347); \ 48326 __ret_347 = __builtin_shufflevector(__ret_347, __ret_347, 7, 6, 5, 4, 3, 2, 1, 0); \ 48327 __ret_347; \ 48328 }) 48329 #endif 48330 48331 #ifdef __LITTLE_ENDIAN__ 48332 #define vcopy_laneq_u32(__p0_348, __p1_348, __p2_348, __p3_348) __extension__ ({ \ 48333 uint32x2_t __ret_348; \ 48334 uint32x2_t __s0_348 = __p0_348; \ 48335 uint32x4_t __s2_348 = __p2_348; \ 48336 __ret_348 = vset_lane_u32(vgetq_lane_u32(__s2_348, __p3_348), __s0_348, __p1_348); \ 48337 __ret_348; \ 48338 }) 48339 #else 48340 #define vcopy_laneq_u32(__p0_349, __p1_349, __p2_349, __p3_349) __extension__ ({ \ 48341 uint32x2_t __ret_349; \ 48342 uint32x2_t __s0_349 = __p0_349; \ 48343 uint32x4_t __s2_349 = __p2_349; \ 48344 uint32x2_t __rev0_349; __rev0_349 = __builtin_shufflevector(__s0_349, __s0_349, 1, 0); \ 48345 uint32x4_t __rev2_349; __rev2_349 = __builtin_shufflevector(__s2_349, __s2_349, 3, 2, 1, 0); \ 48346 __ret_349 = 
__noswap_vset_lane_u32(__noswap_vgetq_lane_u32(__rev2_349, __p3_349), __rev0_349, __p1_349); \ 48347 __ret_349 = __builtin_shufflevector(__ret_349, __ret_349, 1, 0); \ 48348 __ret_349; \ 48349 }) 48350 #endif 48351 48352 #ifdef __LITTLE_ENDIAN__ 48353 #define vcopy_laneq_u64(__p0_350, __p1_350, __p2_350, __p3_350) __extension__ ({ \ 48354 uint64x1_t __ret_350; \ 48355 uint64x1_t __s0_350 = __p0_350; \ 48356 uint64x2_t __s2_350 = __p2_350; \ 48357 __ret_350 = vset_lane_u64(vgetq_lane_u64(__s2_350, __p3_350), __s0_350, __p1_350); \ 48358 __ret_350; \ 48359 }) 48360 #else 48361 #define vcopy_laneq_u64(__p0_351, __p1_351, __p2_351, __p3_351) __extension__ ({ \ 48362 uint64x1_t __ret_351; \ 48363 uint64x1_t __s0_351 = __p0_351; \ 48364 uint64x2_t __s2_351 = __p2_351; \ 48365 uint64x2_t __rev2_351; __rev2_351 = __builtin_shufflevector(__s2_351, __s2_351, 1, 0); \ 48366 __ret_351 = vset_lane_u64(__noswap_vgetq_lane_u64(__rev2_351, __p3_351), __s0_351, __p1_351); \ 48367 __ret_351; \ 48368 }) 48369 #endif 48370 48371 #ifdef __LITTLE_ENDIAN__ 48372 #define vcopy_laneq_u16(__p0_352, __p1_352, __p2_352, __p3_352) __extension__ ({ \ 48373 uint16x4_t __ret_352; \ 48374 uint16x4_t __s0_352 = __p0_352; \ 48375 uint16x8_t __s2_352 = __p2_352; \ 48376 __ret_352 = vset_lane_u16(vgetq_lane_u16(__s2_352, __p3_352), __s0_352, __p1_352); \ 48377 __ret_352; \ 48378 }) 48379 #else 48380 #define vcopy_laneq_u16(__p0_353, __p1_353, __p2_353, __p3_353) __extension__ ({ \ 48381 uint16x4_t __ret_353; \ 48382 uint16x4_t __s0_353 = __p0_353; \ 48383 uint16x8_t __s2_353 = __p2_353; \ 48384 uint16x4_t __rev0_353; __rev0_353 = __builtin_shufflevector(__s0_353, __s0_353, 3, 2, 1, 0); \ 48385 uint16x8_t __rev2_353; __rev2_353 = __builtin_shufflevector(__s2_353, __s2_353, 7, 6, 5, 4, 3, 2, 1, 0); \ 48386 __ret_353 = __noswap_vset_lane_u16(__noswap_vgetq_lane_u16(__rev2_353, __p3_353), __rev0_353, __p1_353); \ 48387 __ret_353 = __builtin_shufflevector(__ret_353, __ret_353, 3, 2, 1, 0); \ 48388 
__ret_353; \ 48389 }) 48390 #endif 48391 48392 #ifdef __LITTLE_ENDIAN__ 48393 #define vcopy_laneq_s8(__p0_354, __p1_354, __p2_354, __p3_354) __extension__ ({ \ 48394 int8x8_t __ret_354; \ 48395 int8x8_t __s0_354 = __p0_354; \ 48396 int8x16_t __s2_354 = __p2_354; \ 48397 __ret_354 = vset_lane_s8(vgetq_lane_s8(__s2_354, __p3_354), __s0_354, __p1_354); \ 48398 __ret_354; \ 48399 }) 48400 #else 48401 #define vcopy_laneq_s8(__p0_355, __p1_355, __p2_355, __p3_355) __extension__ ({ \ 48402 int8x8_t __ret_355; \ 48403 int8x8_t __s0_355 = __p0_355; \ 48404 int8x16_t __s2_355 = __p2_355; \ 48405 int8x8_t __rev0_355; __rev0_355 = __builtin_shufflevector(__s0_355, __s0_355, 7, 6, 5, 4, 3, 2, 1, 0); \ 48406 int8x16_t __rev2_355; __rev2_355 = __builtin_shufflevector(__s2_355, __s2_355, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 48407 __ret_355 = __noswap_vset_lane_s8(__noswap_vgetq_lane_s8(__rev2_355, __p3_355), __rev0_355, __p1_355); \ 48408 __ret_355 = __builtin_shufflevector(__ret_355, __ret_355, 7, 6, 5, 4, 3, 2, 1, 0); \ 48409 __ret_355; \ 48410 }) 48411 #endif 48412 48413 #ifdef __LITTLE_ENDIAN__ 48414 #define vcopy_laneq_f32(__p0_356, __p1_356, __p2_356, __p3_356) __extension__ ({ \ 48415 float32x2_t __ret_356; \ 48416 float32x2_t __s0_356 = __p0_356; \ 48417 float32x4_t __s2_356 = __p2_356; \ 48418 __ret_356 = vset_lane_f32(vgetq_lane_f32(__s2_356, __p3_356), __s0_356, __p1_356); \ 48419 __ret_356; \ 48420 }) 48421 #else 48422 #define vcopy_laneq_f32(__p0_357, __p1_357, __p2_357, __p3_357) __extension__ ({ \ 48423 float32x2_t __ret_357; \ 48424 float32x2_t __s0_357 = __p0_357; \ 48425 float32x4_t __s2_357 = __p2_357; \ 48426 float32x2_t __rev0_357; __rev0_357 = __builtin_shufflevector(__s0_357, __s0_357, 1, 0); \ 48427 float32x4_t __rev2_357; __rev2_357 = __builtin_shufflevector(__s2_357, __s2_357, 3, 2, 1, 0); \ 48428 __ret_357 = __noswap_vset_lane_f32(__noswap_vgetq_lane_f32(__rev2_357, __p3_357), __rev0_357, __p1_357); \ 48429 __ret_357 = 
__builtin_shufflevector(__ret_357, __ret_357, 1, 0); \ 48430 __ret_357; \ 48431 }) 48432 #endif 48433 48434 #ifdef __LITTLE_ENDIAN__ 48435 #define vcopy_laneq_s32(__p0_358, __p1_358, __p2_358, __p3_358) __extension__ ({ \ 48436 int32x2_t __ret_358; \ 48437 int32x2_t __s0_358 = __p0_358; \ 48438 int32x4_t __s2_358 = __p2_358; \ 48439 __ret_358 = vset_lane_s32(vgetq_lane_s32(__s2_358, __p3_358), __s0_358, __p1_358); \ 48440 __ret_358; \ 48441 }) 48442 #else 48443 #define vcopy_laneq_s32(__p0_359, __p1_359, __p2_359, __p3_359) __extension__ ({ \ 48444 int32x2_t __ret_359; \ 48445 int32x2_t __s0_359 = __p0_359; \ 48446 int32x4_t __s2_359 = __p2_359; \ 48447 int32x2_t __rev0_359; __rev0_359 = __builtin_shufflevector(__s0_359, __s0_359, 1, 0); \ 48448 int32x4_t __rev2_359; __rev2_359 = __builtin_shufflevector(__s2_359, __s2_359, 3, 2, 1, 0); \ 48449 __ret_359 = __noswap_vset_lane_s32(__noswap_vgetq_lane_s32(__rev2_359, __p3_359), __rev0_359, __p1_359); \ 48450 __ret_359 = __builtin_shufflevector(__ret_359, __ret_359, 1, 0); \ 48451 __ret_359; \ 48452 }) 48453 #endif 48454 48455 #ifdef __LITTLE_ENDIAN__ 48456 #define vcopy_laneq_s64(__p0_360, __p1_360, __p2_360, __p3_360) __extension__ ({ \ 48457 int64x1_t __ret_360; \ 48458 int64x1_t __s0_360 = __p0_360; \ 48459 int64x2_t __s2_360 = __p2_360; \ 48460 __ret_360 = vset_lane_s64(vgetq_lane_s64(__s2_360, __p3_360), __s0_360, __p1_360); \ 48461 __ret_360; \ 48462 }) 48463 #else 48464 #define vcopy_laneq_s64(__p0_361, __p1_361, __p2_361, __p3_361) __extension__ ({ \ 48465 int64x1_t __ret_361; \ 48466 int64x1_t __s0_361 = __p0_361; \ 48467 int64x2_t __s2_361 = __p2_361; \ 48468 int64x2_t __rev2_361; __rev2_361 = __builtin_shufflevector(__s2_361, __s2_361, 1, 0); \ 48469 __ret_361 = vset_lane_s64(__noswap_vgetq_lane_s64(__rev2_361, __p3_361), __s0_361, __p1_361); \ 48470 __ret_361; \ 48471 }) 48472 #endif 48473 48474 #ifdef __LITTLE_ENDIAN__ 48475 #define vcopy_laneq_s16(__p0_362, __p1_362, __p2_362, __p3_362) __extension__ ({ \ 
48476 int16x4_t __ret_362; \ 48477 int16x4_t __s0_362 = __p0_362; \ 48478 int16x8_t __s2_362 = __p2_362; \ 48479 __ret_362 = vset_lane_s16(vgetq_lane_s16(__s2_362, __p3_362), __s0_362, __p1_362); \ 48480 __ret_362; \ 48481 }) 48482 #else 48483 #define vcopy_laneq_s16(__p0_363, __p1_363, __p2_363, __p3_363) __extension__ ({ \ 48484 int16x4_t __ret_363; \ 48485 int16x4_t __s0_363 = __p0_363; \ 48486 int16x8_t __s2_363 = __p2_363; \ 48487 int16x4_t __rev0_363; __rev0_363 = __builtin_shufflevector(__s0_363, __s0_363, 3, 2, 1, 0); \ 48488 int16x8_t __rev2_363; __rev2_363 = __builtin_shufflevector(__s2_363, __s2_363, 7, 6, 5, 4, 3, 2, 1, 0); \ 48489 __ret_363 = __noswap_vset_lane_s16(__noswap_vgetq_lane_s16(__rev2_363, __p3_363), __rev0_363, __p1_363); \ 48490 __ret_363 = __builtin_shufflevector(__ret_363, __ret_363, 3, 2, 1, 0); \ 48491 __ret_363; \ 48492 }) 48493 #endif 48494 48495 #define vcreate_p64(__p0) __extension__ ({ \ 48496 poly64x1_t __ret; \ 48497 uint64_t __promote = __p0; \ 48498 __ret = (poly64x1_t)(__promote); \ 48499 __ret; \ 48500 }) 48501 #define vcreate_f64(__p0) __extension__ ({ \ 48502 float64x1_t __ret; \ 48503 uint64_t __promote = __p0; \ 48504 __ret = (float64x1_t)(__promote); \ 48505 __ret; \ 48506 }) 48507 __ai __attribute__((target("neon"))) float32_t vcvts_f32_s32(int32_t __p0) { 48508 float32_t __ret; 48509 __ret = (float32_t) __builtin_neon_vcvts_f32_s32(__p0); 48510 return __ret; 48511 } 48512 __ai __attribute__((target("neon"))) float32_t vcvts_f32_u32(uint32_t __p0) { 48513 float32_t __ret; 48514 __ret = (float32_t) __builtin_neon_vcvts_f32_u32(__p0); 48515 return __ret; 48516 } 48517 #ifdef __LITTLE_ENDIAN__ 48518 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_f64(float64x2_t __p0) { 48519 float32x2_t __ret; 48520 __ret = (float32x2_t) __builtin_neon_vcvt_f32_f64((int8x16_t)__p0, 9); 48521 return __ret; 48522 } 48523 #else 48524 __ai __attribute__((target("neon"))) float32x2_t vcvt_f32_f64(float64x2_t __p0) { 48525 
float32x2_t __ret; 48526 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48527 __ret = (float32x2_t) __builtin_neon_vcvt_f32_f64((int8x16_t)__rev0, 9); 48528 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48529 return __ret; 48530 } 48531 __ai __attribute__((target("neon"))) float32x2_t __noswap_vcvt_f32_f64(float64x2_t __p0) { 48532 float32x2_t __ret; 48533 __ret = (float32x2_t) __builtin_neon_vcvt_f32_f64((int8x16_t)__p0, 9); 48534 return __ret; 48535 } 48536 #endif 48537 48538 __ai __attribute__((target("neon"))) float64_t vcvtd_f64_s64(int64_t __p0) { 48539 float64_t __ret; 48540 __ret = (float64_t) __builtin_neon_vcvtd_f64_s64(__p0); 48541 return __ret; 48542 } 48543 __ai __attribute__((target("neon"))) float64_t vcvtd_f64_u64(uint64_t __p0) { 48544 float64_t __ret; 48545 __ret = (float64_t) __builtin_neon_vcvtd_f64_u64(__p0); 48546 return __ret; 48547 } 48548 #ifdef __LITTLE_ENDIAN__ 48549 __ai __attribute__((target("neon"))) float64x2_t vcvtq_f64_u64(uint64x2_t __p0) { 48550 float64x2_t __ret; 48551 __ret = (float64x2_t) __builtin_neon_vcvtq_f64_v((int8x16_t)__p0, 51); 48552 return __ret; 48553 } 48554 #else 48555 __ai __attribute__((target("neon"))) float64x2_t vcvtq_f64_u64(uint64x2_t __p0) { 48556 float64x2_t __ret; 48557 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48558 __ret = (float64x2_t) __builtin_neon_vcvtq_f64_v((int8x16_t)__rev0, 51); 48559 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48560 return __ret; 48561 } 48562 #endif 48563 48564 #ifdef __LITTLE_ENDIAN__ 48565 __ai __attribute__((target("neon"))) float64x2_t vcvtq_f64_s64(int64x2_t __p0) { 48566 float64x2_t __ret; 48567 __ret = (float64x2_t) __builtin_neon_vcvtq_f64_v((int8x16_t)__p0, 35); 48568 return __ret; 48569 } 48570 #else 48571 __ai __attribute__((target("neon"))) float64x2_t vcvtq_f64_s64(int64x2_t __p0) { 48572 float64x2_t __ret; 48573 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48574 __ret = 
(float64x2_t) __builtin_neon_vcvtq_f64_v((int8x16_t)__rev0, 35); 48575 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48576 return __ret; 48577 } 48578 #endif 48579 48580 __ai __attribute__((target("neon"))) float64x1_t vcvt_f64_u64(uint64x1_t __p0) { 48581 float64x1_t __ret; 48582 __ret = (float64x1_t) __builtin_neon_vcvt_f64_v((int8x8_t)__p0, 19); 48583 return __ret; 48584 } 48585 __ai __attribute__((target("neon"))) float64x1_t vcvt_f64_s64(int64x1_t __p0) { 48586 float64x1_t __ret; 48587 __ret = (float64x1_t) __builtin_neon_vcvt_f64_v((int8x8_t)__p0, 3); 48588 return __ret; 48589 } 48590 #ifdef __LITTLE_ENDIAN__ 48591 __ai __attribute__((target("neon"))) float64x2_t vcvt_f64_f32(float32x2_t __p0) { 48592 float64x2_t __ret; 48593 __ret = (float64x2_t) __builtin_neon_vcvt_f64_f32((int8x8_t)__p0, 42); 48594 return __ret; 48595 } 48596 #else 48597 __ai __attribute__((target("neon"))) float64x2_t vcvt_f64_f32(float32x2_t __p0) { 48598 float64x2_t __ret; 48599 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48600 __ret = (float64x2_t) __builtin_neon_vcvt_f64_f32((int8x8_t)__rev0, 42); 48601 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48602 return __ret; 48603 } 48604 __ai __attribute__((target("neon"))) float64x2_t __noswap_vcvt_f64_f32(float32x2_t __p0) { 48605 float64x2_t __ret; 48606 __ret = (float64x2_t) __builtin_neon_vcvt_f64_f32((int8x8_t)__p0, 42); 48607 return __ret; 48608 } 48609 #endif 48610 48611 #ifdef __LITTLE_ENDIAN__ 48612 __ai __attribute__((target("neon"))) float16x8_t vcvt_high_f16_f32(float16x4_t __p0, float32x4_t __p1) { 48613 float16x8_t __ret; 48614 __ret = vcombine_f16(__p0, vcvt_f16_f32(__p1)); 48615 return __ret; 48616 } 48617 #else 48618 __ai __attribute__((target("neon"))) float16x8_t vcvt_high_f16_f32(float16x4_t __p0, float32x4_t __p1) { 48619 float16x8_t __ret; 48620 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 48621 float32x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 48622 __ret = __noswap_vcombine_f16(__rev0, __noswap_vcvt_f16_f32(__rev1)); 48623 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 48624 return __ret; 48625 } 48626 #endif 48627 48628 #ifdef __LITTLE_ENDIAN__ 48629 __ai __attribute__((target("neon"))) float32x4_t vcvt_high_f32_f16(float16x8_t __p0) { 48630 float32x4_t __ret; 48631 __ret = vcvt_f32_f16(vget_high_f16(__p0)); 48632 return __ret; 48633 } 48634 #else 48635 __ai __attribute__((target("neon"))) float32x4_t vcvt_high_f32_f16(float16x8_t __p0) { 48636 float32x4_t __ret; 48637 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 48638 __ret = __noswap_vcvt_f32_f16(__noswap_vget_high_f16(__rev0)); 48639 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 48640 return __ret; 48641 } 48642 #endif 48643 48644 #ifdef __LITTLE_ENDIAN__ 48645 __ai __attribute__((target("neon"))) float32x4_t vcvt_high_f32_f64(float32x2_t __p0, float64x2_t __p1) { 48646 float32x4_t __ret; 48647 __ret = vcombine_f32(__p0, vcvt_f32_f64(__p1)); 48648 return __ret; 48649 } 48650 #else 48651 __ai __attribute__((target("neon"))) float32x4_t vcvt_high_f32_f64(float32x2_t __p0, float64x2_t __p1) { 48652 float32x4_t __ret; 48653 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48654 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 48655 __ret = __noswap_vcombine_f32(__rev0, __noswap_vcvt_f32_f64(__rev1)); 48656 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 48657 return __ret; 48658 } 48659 #endif 48660 48661 #ifdef __LITTLE_ENDIAN__ 48662 __ai __attribute__((target("neon"))) float64x2_t vcvt_high_f64_f32(float32x4_t __p0) { 48663 float64x2_t __ret; 48664 __ret = vcvt_f64_f32(vget_high_f32(__p0)); 48665 return __ret; 48666 } 48667 #else 48668 __ai __attribute__((target("neon"))) float64x2_t vcvt_high_f64_f32(float32x4_t __p0) { 48669 float64x2_t __ret; 48670 float32x4_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 48671 __ret = __noswap_vcvt_f64_f32(__noswap_vget_high_f32(__rev0)); 48672 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48673 return __ret; 48674 } 48675 #endif 48676 48677 #define vcvts_n_f32_u32(__p0, __p1) __extension__ ({ \ 48678 float32_t __ret; \ 48679 uint32_t __s0 = __p0; \ 48680 __ret = (float32_t) __builtin_neon_vcvts_n_f32_u32(__s0, __p1); \ 48681 __ret; \ 48682 }) 48683 #define vcvts_n_f32_s32(__p0, __p1) __extension__ ({ \ 48684 float32_t __ret; \ 48685 int32_t __s0 = __p0; \ 48686 __ret = (float32_t) __builtin_neon_vcvts_n_f32_s32(__s0, __p1); \ 48687 __ret; \ 48688 }) 48689 #ifdef __LITTLE_ENDIAN__ 48690 #define vcvtq_n_f64_u64(__p0, __p1) __extension__ ({ \ 48691 float64x2_t __ret; \ 48692 uint64x2_t __s0 = __p0; \ 48693 __ret = (float64x2_t) __builtin_neon_vcvtq_n_f64_v((int8x16_t)__s0, __p1, 51); \ 48694 __ret; \ 48695 }) 48696 #else 48697 #define vcvtq_n_f64_u64(__p0, __p1) __extension__ ({ \ 48698 float64x2_t __ret; \ 48699 uint64x2_t __s0 = __p0; \ 48700 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 48701 __ret = (float64x2_t) __builtin_neon_vcvtq_n_f64_v((int8x16_t)__rev0, __p1, 51); \ 48702 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 48703 __ret; \ 48704 }) 48705 #endif 48706 48707 #ifdef __LITTLE_ENDIAN__ 48708 #define vcvtq_n_f64_s64(__p0, __p1) __extension__ ({ \ 48709 float64x2_t __ret; \ 48710 int64x2_t __s0 = __p0; \ 48711 __ret = (float64x2_t) __builtin_neon_vcvtq_n_f64_v((int8x16_t)__s0, __p1, 35); \ 48712 __ret; \ 48713 }) 48714 #else 48715 #define vcvtq_n_f64_s64(__p0, __p1) __extension__ ({ \ 48716 float64x2_t __ret; \ 48717 int64x2_t __s0 = __p0; \ 48718 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 48719 __ret = (float64x2_t) __builtin_neon_vcvtq_n_f64_v((int8x16_t)__rev0, __p1, 35); \ 48720 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 48721 __ret; \ 48722 }) 48723 #endif 48724 48725 
#define vcvt_n_f64_u64(__p0, __p1) __extension__ ({ \ 48726 float64x1_t __ret; \ 48727 uint64x1_t __s0 = __p0; \ 48728 __ret = (float64x1_t) __builtin_neon_vcvt_n_f64_v((int8x8_t)__s0, __p1, 19); \ 48729 __ret; \ 48730 }) 48731 #define vcvt_n_f64_s64(__p0, __p1) __extension__ ({ \ 48732 float64x1_t __ret; \ 48733 int64x1_t __s0 = __p0; \ 48734 __ret = (float64x1_t) __builtin_neon_vcvt_n_f64_v((int8x8_t)__s0, __p1, 3); \ 48735 __ret; \ 48736 }) 48737 #define vcvtd_n_f64_u64(__p0, __p1) __extension__ ({ \ 48738 float64_t __ret; \ 48739 uint64_t __s0 = __p0; \ 48740 __ret = (float64_t) __builtin_neon_vcvtd_n_f64_u64(__s0, __p1); \ 48741 __ret; \ 48742 }) 48743 #define vcvtd_n_f64_s64(__p0, __p1) __extension__ ({ \ 48744 float64_t __ret; \ 48745 int64_t __s0 = __p0; \ 48746 __ret = (float64_t) __builtin_neon_vcvtd_n_f64_s64(__s0, __p1); \ 48747 __ret; \ 48748 }) 48749 #define vcvts_n_s32_f32(__p0, __p1) __extension__ ({ \ 48750 int32_t __ret; \ 48751 float32_t __s0 = __p0; \ 48752 __ret = (int32_t) __builtin_neon_vcvts_n_s32_f32(__s0, __p1); \ 48753 __ret; \ 48754 }) 48755 #ifdef __LITTLE_ENDIAN__ 48756 #define vcvtq_n_s64_f64(__p0, __p1) __extension__ ({ \ 48757 int64x2_t __ret; \ 48758 float64x2_t __s0 = __p0; \ 48759 __ret = (int64x2_t) __builtin_neon_vcvtq_n_s64_v((int8x16_t)__s0, __p1, 35); \ 48760 __ret; \ 48761 }) 48762 #else 48763 #define vcvtq_n_s64_f64(__p0, __p1) __extension__ ({ \ 48764 int64x2_t __ret; \ 48765 float64x2_t __s0 = __p0; \ 48766 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 48767 __ret = (int64x2_t) __builtin_neon_vcvtq_n_s64_v((int8x16_t)__rev0, __p1, 35); \ 48768 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 48769 __ret; \ 48770 }) 48771 #endif 48772 48773 #define vcvt_n_s64_f64(__p0, __p1) __extension__ ({ \ 48774 int64x1_t __ret; \ 48775 float64x1_t __s0 = __p0; \ 48776 __ret = (int64x1_t) __builtin_neon_vcvt_n_s64_v((int8x8_t)__s0, __p1, 3); \ 48777 __ret; \ 48778 }) 48779 #define 
vcvtd_n_s64_f64(__p0, __p1) __extension__ ({ \ 48780 int64_t __ret; \ 48781 float64_t __s0 = __p0; \ 48782 __ret = (int64_t) __builtin_neon_vcvtd_n_s64_f64(__s0, __p1); \ 48783 __ret; \ 48784 }) 48785 #define vcvts_n_u32_f32(__p0, __p1) __extension__ ({ \ 48786 uint32_t __ret; \ 48787 float32_t __s0 = __p0; \ 48788 __ret = (uint32_t) __builtin_neon_vcvts_n_u32_f32(__s0, __p1); \ 48789 __ret; \ 48790 }) 48791 #ifdef __LITTLE_ENDIAN__ 48792 #define vcvtq_n_u64_f64(__p0, __p1) __extension__ ({ \ 48793 uint64x2_t __ret; \ 48794 float64x2_t __s0 = __p0; \ 48795 __ret = (uint64x2_t) __builtin_neon_vcvtq_n_u64_v((int8x16_t)__s0, __p1, 51); \ 48796 __ret; \ 48797 }) 48798 #else 48799 #define vcvtq_n_u64_f64(__p0, __p1) __extension__ ({ \ 48800 uint64x2_t __ret; \ 48801 float64x2_t __s0 = __p0; \ 48802 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 48803 __ret = (uint64x2_t) __builtin_neon_vcvtq_n_u64_v((int8x16_t)__rev0, __p1, 51); \ 48804 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 48805 __ret; \ 48806 }) 48807 #endif 48808 48809 #define vcvt_n_u64_f64(__p0, __p1) __extension__ ({ \ 48810 uint64x1_t __ret; \ 48811 float64x1_t __s0 = __p0; \ 48812 __ret = (uint64x1_t) __builtin_neon_vcvt_n_u64_v((int8x8_t)__s0, __p1, 19); \ 48813 __ret; \ 48814 }) 48815 #define vcvtd_n_u64_f64(__p0, __p1) __extension__ ({ \ 48816 uint64_t __ret; \ 48817 float64_t __s0 = __p0; \ 48818 __ret = (uint64_t) __builtin_neon_vcvtd_n_u64_f64(__s0, __p1); \ 48819 __ret; \ 48820 }) 48821 __ai __attribute__((target("neon"))) int32_t vcvts_s32_f32(float32_t __p0) { 48822 int32_t __ret; 48823 __ret = (int32_t) __builtin_neon_vcvts_s32_f32(__p0); 48824 return __ret; 48825 } 48826 __ai __attribute__((target("neon"))) int64_t vcvtd_s64_f64(float64_t __p0) { 48827 int64_t __ret; 48828 __ret = (int64_t) __builtin_neon_vcvtd_s64_f64(__p0); 48829 return __ret; 48830 } 48831 #ifdef __LITTLE_ENDIAN__ 48832 __ai __attribute__((target("neon"))) int64x2_t 
vcvtq_s64_f64(float64x2_t __p0) { 48833 int64x2_t __ret; 48834 __ret = (int64x2_t) __builtin_neon_vcvtq_s64_v((int8x16_t)__p0, 35); 48835 return __ret; 48836 } 48837 #else 48838 __ai __attribute__((target("neon"))) int64x2_t vcvtq_s64_f64(float64x2_t __p0) { 48839 int64x2_t __ret; 48840 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48841 __ret = (int64x2_t) __builtin_neon_vcvtq_s64_v((int8x16_t)__rev0, 35); 48842 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48843 return __ret; 48844 } 48845 #endif 48846 48847 __ai __attribute__((target("neon"))) int64x1_t vcvt_s64_f64(float64x1_t __p0) { 48848 int64x1_t __ret; 48849 __ret = (int64x1_t) __builtin_neon_vcvt_s64_v((int8x8_t)__p0, 3); 48850 return __ret; 48851 } 48852 __ai __attribute__((target("neon"))) uint32_t vcvts_u32_f32(float32_t __p0) { 48853 uint32_t __ret; 48854 __ret = (uint32_t) __builtin_neon_vcvts_u32_f32(__p0); 48855 return __ret; 48856 } 48857 __ai __attribute__((target("neon"))) uint64_t vcvtd_u64_f64(float64_t __p0) { 48858 uint64_t __ret; 48859 __ret = (uint64_t) __builtin_neon_vcvtd_u64_f64(__p0); 48860 return __ret; 48861 } 48862 #ifdef __LITTLE_ENDIAN__ 48863 __ai __attribute__((target("neon"))) uint64x2_t vcvtq_u64_f64(float64x2_t __p0) { 48864 uint64x2_t __ret; 48865 __ret = (uint64x2_t) __builtin_neon_vcvtq_u64_v((int8x16_t)__p0, 51); 48866 return __ret; 48867 } 48868 #else 48869 __ai __attribute__((target("neon"))) uint64x2_t vcvtq_u64_f64(float64x2_t __p0) { 48870 uint64x2_t __ret; 48871 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48872 __ret = (uint64x2_t) __builtin_neon_vcvtq_u64_v((int8x16_t)__rev0, 51); 48873 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48874 return __ret; 48875 } 48876 #endif 48877 48878 __ai __attribute__((target("neon"))) uint64x1_t vcvt_u64_f64(float64x1_t __p0) { 48879 uint64x1_t __ret; 48880 __ret = (uint64x1_t) __builtin_neon_vcvt_u64_v((int8x8_t)__p0, 19); 48881 return __ret; 48882 } 48883 __ai 
__attribute__((target("neon"))) int32_t vcvtas_s32_f32(float32_t __p0) { 48884 int32_t __ret; 48885 __ret = (int32_t) __builtin_neon_vcvtas_s32_f32(__p0); 48886 return __ret; 48887 } 48888 #ifdef __LITTLE_ENDIAN__ 48889 __ai __attribute__((target("neon"))) int64x2_t vcvtaq_s64_f64(float64x2_t __p0) { 48890 int64x2_t __ret; 48891 __ret = (int64x2_t) __builtin_neon_vcvtaq_s64_v((int8x16_t)__p0, 35); 48892 return __ret; 48893 } 48894 #else 48895 __ai __attribute__((target("neon"))) int64x2_t vcvtaq_s64_f64(float64x2_t __p0) { 48896 int64x2_t __ret; 48897 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48898 __ret = (int64x2_t) __builtin_neon_vcvtaq_s64_v((int8x16_t)__rev0, 35); 48899 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48900 return __ret; 48901 } 48902 #endif 48903 48904 __ai __attribute__((target("neon"))) int64x1_t vcvta_s64_f64(float64x1_t __p0) { 48905 int64x1_t __ret; 48906 __ret = (int64x1_t) __builtin_neon_vcvta_s64_v((int8x8_t)__p0, 3); 48907 return __ret; 48908 } 48909 __ai __attribute__((target("neon"))) int64_t vcvtad_s64_f64(float64_t __p0) { 48910 int64_t __ret; 48911 __ret = (int64_t) __builtin_neon_vcvtad_s64_f64(__p0); 48912 return __ret; 48913 } 48914 __ai __attribute__((target("neon"))) uint32_t vcvtas_u32_f32(float32_t __p0) { 48915 uint32_t __ret; 48916 __ret = (uint32_t) __builtin_neon_vcvtas_u32_f32(__p0); 48917 return __ret; 48918 } 48919 #ifdef __LITTLE_ENDIAN__ 48920 __ai __attribute__((target("neon"))) uint64x2_t vcvtaq_u64_f64(float64x2_t __p0) { 48921 uint64x2_t __ret; 48922 __ret = (uint64x2_t) __builtin_neon_vcvtaq_u64_v((int8x16_t)__p0, 51); 48923 return __ret; 48924 } 48925 #else 48926 __ai __attribute__((target("neon"))) uint64x2_t vcvtaq_u64_f64(float64x2_t __p0) { 48927 uint64x2_t __ret; 48928 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48929 __ret = (uint64x2_t) __builtin_neon_vcvtaq_u64_v((int8x16_t)__rev0, 51); 48930 __ret = __builtin_shufflevector(__ret, __ret, 
1, 0); 48931 return __ret; 48932 } 48933 #endif 48934 48935 __ai __attribute__((target("neon"))) uint64x1_t vcvta_u64_f64(float64x1_t __p0) { 48936 uint64x1_t __ret; 48937 __ret = (uint64x1_t) __builtin_neon_vcvta_u64_v((int8x8_t)__p0, 19); 48938 return __ret; 48939 } 48940 __ai __attribute__((target("neon"))) uint64_t vcvtad_u64_f64(float64_t __p0) { 48941 uint64_t __ret; 48942 __ret = (uint64_t) __builtin_neon_vcvtad_u64_f64(__p0); 48943 return __ret; 48944 } 48945 __ai __attribute__((target("neon"))) int32_t vcvtms_s32_f32(float32_t __p0) { 48946 int32_t __ret; 48947 __ret = (int32_t) __builtin_neon_vcvtms_s32_f32(__p0); 48948 return __ret; 48949 } 48950 #ifdef __LITTLE_ENDIAN__ 48951 __ai __attribute__((target("neon"))) int64x2_t vcvtmq_s64_f64(float64x2_t __p0) { 48952 int64x2_t __ret; 48953 __ret = (int64x2_t) __builtin_neon_vcvtmq_s64_v((int8x16_t)__p0, 35); 48954 return __ret; 48955 } 48956 #else 48957 __ai __attribute__((target("neon"))) int64x2_t vcvtmq_s64_f64(float64x2_t __p0) { 48958 int64x2_t __ret; 48959 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48960 __ret = (int64x2_t) __builtin_neon_vcvtmq_s64_v((int8x16_t)__rev0, 35); 48961 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48962 return __ret; 48963 } 48964 #endif 48965 48966 __ai __attribute__((target("neon"))) int64x1_t vcvtm_s64_f64(float64x1_t __p0) { 48967 int64x1_t __ret; 48968 __ret = (int64x1_t) __builtin_neon_vcvtm_s64_v((int8x8_t)__p0, 3); 48969 return __ret; 48970 } 48971 __ai __attribute__((target("neon"))) int64_t vcvtmd_s64_f64(float64_t __p0) { 48972 int64_t __ret; 48973 __ret = (int64_t) __builtin_neon_vcvtmd_s64_f64(__p0); 48974 return __ret; 48975 } 48976 __ai __attribute__((target("neon"))) uint32_t vcvtms_u32_f32(float32_t __p0) { 48977 uint32_t __ret; 48978 __ret = (uint32_t) __builtin_neon_vcvtms_u32_f32(__p0); 48979 return __ret; 48980 } 48981 #ifdef __LITTLE_ENDIAN__ 48982 __ai __attribute__((target("neon"))) uint64x2_t 
vcvtmq_u64_f64(float64x2_t __p0) { 48983 uint64x2_t __ret; 48984 __ret = (uint64x2_t) __builtin_neon_vcvtmq_u64_v((int8x16_t)__p0, 51); 48985 return __ret; 48986 } 48987 #else 48988 __ai __attribute__((target("neon"))) uint64x2_t vcvtmq_u64_f64(float64x2_t __p0) { 48989 uint64x2_t __ret; 48990 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 48991 __ret = (uint64x2_t) __builtin_neon_vcvtmq_u64_v((int8x16_t)__rev0, 51); 48992 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 48993 return __ret; 48994 } 48995 #endif 48996 48997 __ai __attribute__((target("neon"))) uint64x1_t vcvtm_u64_f64(float64x1_t __p0) { 48998 uint64x1_t __ret; 48999 __ret = (uint64x1_t) __builtin_neon_vcvtm_u64_v((int8x8_t)__p0, 19); 49000 return __ret; 49001 } 49002 __ai __attribute__((target("neon"))) uint64_t vcvtmd_u64_f64(float64_t __p0) { 49003 uint64_t __ret; 49004 __ret = (uint64_t) __builtin_neon_vcvtmd_u64_f64(__p0); 49005 return __ret; 49006 } 49007 __ai __attribute__((target("neon"))) int32_t vcvtns_s32_f32(float32_t __p0) { 49008 int32_t __ret; 49009 __ret = (int32_t) __builtin_neon_vcvtns_s32_f32(__p0); 49010 return __ret; 49011 } 49012 #ifdef __LITTLE_ENDIAN__ 49013 __ai __attribute__((target("neon"))) int64x2_t vcvtnq_s64_f64(float64x2_t __p0) { 49014 int64x2_t __ret; 49015 __ret = (int64x2_t) __builtin_neon_vcvtnq_s64_v((int8x16_t)__p0, 35); 49016 return __ret; 49017 } 49018 #else 49019 __ai __attribute__((target("neon"))) int64x2_t vcvtnq_s64_f64(float64x2_t __p0) { 49020 int64x2_t __ret; 49021 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 49022 __ret = (int64x2_t) __builtin_neon_vcvtnq_s64_v((int8x16_t)__rev0, 35); 49023 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 49024 return __ret; 49025 } 49026 #endif 49027 49028 __ai __attribute__((target("neon"))) int64x1_t vcvtn_s64_f64(float64x1_t __p0) { 49029 int64x1_t __ret; 49030 __ret = (int64x1_t) __builtin_neon_vcvtn_s64_v((int8x8_t)__p0, 3); 49031 return __ret; 49032 } 
49033 __ai __attribute__((target("neon"))) int64_t vcvtnd_s64_f64(float64_t __p0) { 49034 int64_t __ret; 49035 __ret = (int64_t) __builtin_neon_vcvtnd_s64_f64(__p0); 49036 return __ret; 49037 } 49038 __ai __attribute__((target("neon"))) uint32_t vcvtns_u32_f32(float32_t __p0) { 49039 uint32_t __ret; 49040 __ret = (uint32_t) __builtin_neon_vcvtns_u32_f32(__p0); 49041 return __ret; 49042 } 49043 #ifdef __LITTLE_ENDIAN__ 49044 __ai __attribute__((target("neon"))) uint64x2_t vcvtnq_u64_f64(float64x2_t __p0) { 49045 uint64x2_t __ret; 49046 __ret = (uint64x2_t) __builtin_neon_vcvtnq_u64_v((int8x16_t)__p0, 51); 49047 return __ret; 49048 } 49049 #else 49050 __ai __attribute__((target("neon"))) uint64x2_t vcvtnq_u64_f64(float64x2_t __p0) { 49051 uint64x2_t __ret; 49052 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 49053 __ret = (uint64x2_t) __builtin_neon_vcvtnq_u64_v((int8x16_t)__rev0, 51); 49054 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 49055 return __ret; 49056 } 49057 #endif 49058 49059 __ai __attribute__((target("neon"))) uint64x1_t vcvtn_u64_f64(float64x1_t __p0) { 49060 uint64x1_t __ret; 49061 __ret = (uint64x1_t) __builtin_neon_vcvtn_u64_v((int8x8_t)__p0, 19); 49062 return __ret; 49063 } 49064 __ai __attribute__((target("neon"))) uint64_t vcvtnd_u64_f64(float64_t __p0) { 49065 uint64_t __ret; 49066 __ret = (uint64_t) __builtin_neon_vcvtnd_u64_f64(__p0); 49067 return __ret; 49068 } 49069 __ai __attribute__((target("neon"))) int32_t vcvtps_s32_f32(float32_t __p0) { 49070 int32_t __ret; 49071 __ret = (int32_t) __builtin_neon_vcvtps_s32_f32(__p0); 49072 return __ret; 49073 } 49074 #ifdef __LITTLE_ENDIAN__ 49075 __ai __attribute__((target("neon"))) int64x2_t vcvtpq_s64_f64(float64x2_t __p0) { 49076 int64x2_t __ret; 49077 __ret = (int64x2_t) __builtin_neon_vcvtpq_s64_v((int8x16_t)__p0, 35); 49078 return __ret; 49079 } 49080 #else 49081 __ai __attribute__((target("neon"))) int64x2_t vcvtpq_s64_f64(float64x2_t __p0) { 49082 int64x2_t 
__ret; 49083 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 49084 __ret = (int64x2_t) __builtin_neon_vcvtpq_s64_v((int8x16_t)__rev0, 35); 49085 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 49086 return __ret; 49087 } 49088 #endif 49089 49090 __ai __attribute__((target("neon"))) int64x1_t vcvtp_s64_f64(float64x1_t __p0) { 49091 int64x1_t __ret; 49092 __ret = (int64x1_t) __builtin_neon_vcvtp_s64_v((int8x8_t)__p0, 3); 49093 return __ret; 49094 } 49095 __ai __attribute__((target("neon"))) int64_t vcvtpd_s64_f64(float64_t __p0) { 49096 int64_t __ret; 49097 __ret = (int64_t) __builtin_neon_vcvtpd_s64_f64(__p0); 49098 return __ret; 49099 } 49100 __ai __attribute__((target("neon"))) uint32_t vcvtps_u32_f32(float32_t __p0) { 49101 uint32_t __ret; 49102 __ret = (uint32_t) __builtin_neon_vcvtps_u32_f32(__p0); 49103 return __ret; 49104 } 49105 #ifdef __LITTLE_ENDIAN__ 49106 __ai __attribute__((target("neon"))) uint64x2_t vcvtpq_u64_f64(float64x2_t __p0) { 49107 uint64x2_t __ret; 49108 __ret = (uint64x2_t) __builtin_neon_vcvtpq_u64_v((int8x16_t)__p0, 51); 49109 return __ret; 49110 } 49111 #else 49112 __ai __attribute__((target("neon"))) uint64x2_t vcvtpq_u64_f64(float64x2_t __p0) { 49113 uint64x2_t __ret; 49114 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 49115 __ret = (uint64x2_t) __builtin_neon_vcvtpq_u64_v((int8x16_t)__rev0, 51); 49116 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 49117 return __ret; 49118 } 49119 #endif 49120 49121 __ai __attribute__((target("neon"))) uint64x1_t vcvtp_u64_f64(float64x1_t __p0) { 49122 uint64x1_t __ret; 49123 __ret = (uint64x1_t) __builtin_neon_vcvtp_u64_v((int8x8_t)__p0, 19); 49124 return __ret; 49125 } 49126 __ai __attribute__((target("neon"))) uint64_t vcvtpd_u64_f64(float64_t __p0) { 49127 uint64_t __ret; 49128 __ret = (uint64_t) __builtin_neon_vcvtpd_u64_f64(__p0); 49129 return __ret; 49130 } 49131 __ai __attribute__((target("neon"))) float32_t vcvtxd_f32_f64(float64_t 
__p0) { 49132 float32_t __ret; 49133 __ret = (float32_t) __builtin_neon_vcvtxd_f32_f64(__p0); 49134 return __ret; 49135 } 49136 #ifdef __LITTLE_ENDIAN__ 49137 __ai __attribute__((target("neon"))) float32x2_t vcvtx_f32_f64(float64x2_t __p0) { 49138 float32x2_t __ret; 49139 __ret = (float32x2_t) __builtin_neon_vcvtx_f32_v((int8x16_t)__p0, 42); 49140 return __ret; 49141 } 49142 #else 49143 __ai __attribute__((target("neon"))) float32x2_t vcvtx_f32_f64(float64x2_t __p0) { 49144 float32x2_t __ret; 49145 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 49146 __ret = (float32x2_t) __builtin_neon_vcvtx_f32_v((int8x16_t)__rev0, 42); 49147 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 49148 return __ret; 49149 } 49150 __ai __attribute__((target("neon"))) float32x2_t __noswap_vcvtx_f32_f64(float64x2_t __p0) { 49151 float32x2_t __ret; 49152 __ret = (float32x2_t) __builtin_neon_vcvtx_f32_v((int8x16_t)__p0, 42); 49153 return __ret; 49154 } 49155 #endif 49156 49157 #ifdef __LITTLE_ENDIAN__ 49158 __ai __attribute__((target("neon"))) float32x4_t vcvtx_high_f32_f64(float32x2_t __p0, float64x2_t __p1) { 49159 float32x4_t __ret; 49160 __ret = vcombine_f32(__p0, vcvtx_f32_f64(__p1)); 49161 return __ret; 49162 } 49163 #else 49164 __ai __attribute__((target("neon"))) float32x4_t vcvtx_high_f32_f64(float32x2_t __p0, float64x2_t __p1) { 49165 float32x4_t __ret; 49166 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 49167 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 49168 __ret = __noswap_vcombine_f32(__rev0, __noswap_vcvtx_f32_f64(__rev1)); 49169 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 49170 return __ret; 49171 } 49172 #endif 49173 49174 #ifdef __LITTLE_ENDIAN__ 49175 __ai __attribute__((target("neon"))) float64x2_t vdivq_f64(float64x2_t __p0, float64x2_t __p1) { 49176 float64x2_t __ret; 49177 __ret = __p0 / __p1; 49178 return __ret; 49179 } 49180 #else 49181 __ai 
__attribute__((target("neon"))) float64x2_t vdivq_f64(float64x2_t __p0, float64x2_t __p1) { 49182 float64x2_t __ret; 49183 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 49184 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 49185 __ret = __rev0 / __rev1; 49186 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 49187 return __ret; 49188 } 49189 #endif 49190 49191 #ifdef __LITTLE_ENDIAN__ 49192 __ai __attribute__((target("neon"))) float32x4_t vdivq_f32(float32x4_t __p0, float32x4_t __p1) { 49193 float32x4_t __ret; 49194 __ret = __p0 / __p1; 49195 return __ret; 49196 } 49197 #else 49198 __ai __attribute__((target("neon"))) float32x4_t vdivq_f32(float32x4_t __p0, float32x4_t __p1) { 49199 float32x4_t __ret; 49200 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 49201 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 49202 __ret = __rev0 / __rev1; 49203 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 49204 return __ret; 49205 } 49206 #endif 49207 49208 __ai __attribute__((target("neon"))) float64x1_t vdiv_f64(float64x1_t __p0, float64x1_t __p1) { 49209 float64x1_t __ret; 49210 __ret = __p0 / __p1; 49211 return __ret; 49212 } 49213 #ifdef __LITTLE_ENDIAN__ 49214 __ai __attribute__((target("neon"))) float32x2_t vdiv_f32(float32x2_t __p0, float32x2_t __p1) { 49215 float32x2_t __ret; 49216 __ret = __p0 / __p1; 49217 return __ret; 49218 } 49219 #else 49220 __ai __attribute__((target("neon"))) float32x2_t vdiv_f32(float32x2_t __p0, float32x2_t __p1) { 49221 float32x2_t __ret; 49222 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 49223 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 49224 __ret = __rev0 / __rev1; 49225 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 49226 return __ret; 49227 } 49228 #endif 49229 49230 #ifdef __LITTLE_ENDIAN__ 49231 #define vdupb_lane_p8(__p0, __p1) __extension__ ({ \ 49232 
poly8_t __ret; \ 49233 poly8x8_t __s0 = __p0; \ 49234 __ret = (poly8_t) __builtin_neon_vdupb_lane_i8((poly8x8_t)__s0, __p1); \ 49235 __ret; \ 49236 }) 49237 #else 49238 #define vdupb_lane_p8(__p0, __p1) __extension__ ({ \ 49239 poly8_t __ret; \ 49240 poly8x8_t __s0 = __p0; \ 49241 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 49242 __ret = (poly8_t) __builtin_neon_vdupb_lane_i8((poly8x8_t)__rev0, __p1); \ 49243 __ret; \ 49244 }) 49245 #endif 49246 49247 #ifdef __LITTLE_ENDIAN__ 49248 #define vduph_lane_p16(__p0, __p1) __extension__ ({ \ 49249 poly16_t __ret; \ 49250 poly16x4_t __s0 = __p0; \ 49251 __ret = (poly16_t) __builtin_neon_vduph_lane_i16((poly16x4_t)__s0, __p1); \ 49252 __ret; \ 49253 }) 49254 #else 49255 #define vduph_lane_p16(__p0, __p1) __extension__ ({ \ 49256 poly16_t __ret; \ 49257 poly16x4_t __s0 = __p0; \ 49258 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 49259 __ret = (poly16_t) __builtin_neon_vduph_lane_i16((poly16x4_t)__rev0, __p1); \ 49260 __ret; \ 49261 }) 49262 #endif 49263 49264 #ifdef __LITTLE_ENDIAN__ 49265 #define vdupb_lane_u8(__p0, __p1) __extension__ ({ \ 49266 uint8_t __ret; \ 49267 uint8x8_t __s0 = __p0; \ 49268 __ret = (uint8_t) __builtin_neon_vdupb_lane_i8((int8x8_t)__s0, __p1); \ 49269 __ret; \ 49270 }) 49271 #else 49272 #define vdupb_lane_u8(__p0, __p1) __extension__ ({ \ 49273 uint8_t __ret; \ 49274 uint8x8_t __s0 = __p0; \ 49275 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 49276 __ret = (uint8_t) __builtin_neon_vdupb_lane_i8((int8x8_t)__rev0, __p1); \ 49277 __ret; \ 49278 }) 49279 #endif 49280 49281 #ifdef __LITTLE_ENDIAN__ 49282 #define vdups_lane_u32(__p0, __p1) __extension__ ({ \ 49283 uint32_t __ret; \ 49284 uint32x2_t __s0 = __p0; \ 49285 __ret = (uint32_t) __builtin_neon_vdups_lane_i32((int32x2_t)__s0, __p1); \ 49286 __ret; \ 49287 }) 49288 #else 49289 #define vdups_lane_u32(__p0, __p1) __extension__ 
({ \ 49290 uint32_t __ret; \ 49291 uint32x2_t __s0 = __p0; \ 49292 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 49293 __ret = (uint32_t) __builtin_neon_vdups_lane_i32((int32x2_t)__rev0, __p1); \ 49294 __ret; \ 49295 }) 49296 #endif 49297 49298 #define vdupd_lane_u64(__p0, __p1) __extension__ ({ \ 49299 uint64_t __ret; \ 49300 uint64x1_t __s0 = __p0; \ 49301 __ret = (uint64_t) __builtin_neon_vdupd_lane_i64((int64x1_t)__s0, __p1); \ 49302 __ret; \ 49303 }) 49304 #ifdef __LITTLE_ENDIAN__ 49305 #define vduph_lane_u16(__p0, __p1) __extension__ ({ \ 49306 uint16_t __ret; \ 49307 uint16x4_t __s0 = __p0; \ 49308 __ret = (uint16_t) __builtin_neon_vduph_lane_i16((int16x4_t)__s0, __p1); \ 49309 __ret; \ 49310 }) 49311 #else 49312 #define vduph_lane_u16(__p0, __p1) __extension__ ({ \ 49313 uint16_t __ret; \ 49314 uint16x4_t __s0 = __p0; \ 49315 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 49316 __ret = (uint16_t) __builtin_neon_vduph_lane_i16((int16x4_t)__rev0, __p1); \ 49317 __ret; \ 49318 }) 49319 #endif 49320 49321 #ifdef __LITTLE_ENDIAN__ 49322 #define vdupb_lane_s8(__p0, __p1) __extension__ ({ \ 49323 int8_t __ret; \ 49324 int8x8_t __s0 = __p0; \ 49325 __ret = (int8_t) __builtin_neon_vdupb_lane_i8((int8x8_t)__s0, __p1); \ 49326 __ret; \ 49327 }) 49328 #else 49329 #define vdupb_lane_s8(__p0, __p1) __extension__ ({ \ 49330 int8_t __ret; \ 49331 int8x8_t __s0 = __p0; \ 49332 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 49333 __ret = (int8_t) __builtin_neon_vdupb_lane_i8((int8x8_t)__rev0, __p1); \ 49334 __ret; \ 49335 }) 49336 #endif 49337 49338 #define vdupd_lane_f64(__p0, __p1) __extension__ ({ \ 49339 float64_t __ret; \ 49340 float64x1_t __s0 = __p0; \ 49341 __ret = (float64_t) __builtin_neon_vdupd_lane_f64((float64x1_t)__s0, __p1); \ 49342 __ret; \ 49343 }) 49344 #ifdef __LITTLE_ENDIAN__ 49345 #define vdups_lane_f32(__p0, __p1) __extension__ ({ \ 49346 float32_t 
__ret; \ 49347 float32x2_t __s0 = __p0; \ 49348 __ret = (float32_t) __builtin_neon_vdups_lane_f32((float32x2_t)__s0, __p1); \ 49349 __ret; \ 49350 }) 49351 #else 49352 #define vdups_lane_f32(__p0, __p1) __extension__ ({ \ 49353 float32_t __ret; \ 49354 float32x2_t __s0 = __p0; \ 49355 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 49356 __ret = (float32_t) __builtin_neon_vdups_lane_f32((float32x2_t)__rev0, __p1); \ 49357 __ret; \ 49358 }) 49359 #endif 49360 49361 #ifdef __LITTLE_ENDIAN__ 49362 #define vdups_lane_s32(__p0, __p1) __extension__ ({ \ 49363 int32_t __ret; \ 49364 int32x2_t __s0 = __p0; \ 49365 __ret = (int32_t) __builtin_neon_vdups_lane_i32((int32x2_t)__s0, __p1); \ 49366 __ret; \ 49367 }) 49368 #else 49369 #define vdups_lane_s32(__p0, __p1) __extension__ ({ \ 49370 int32_t __ret; \ 49371 int32x2_t __s0 = __p0; \ 49372 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 49373 __ret = (int32_t) __builtin_neon_vdups_lane_i32((int32x2_t)__rev0, __p1); \ 49374 __ret; \ 49375 }) 49376 #endif 49377 49378 #define vdupd_lane_s64(__p0, __p1) __extension__ ({ \ 49379 int64_t __ret; \ 49380 int64x1_t __s0 = __p0; \ 49381 __ret = (int64_t) __builtin_neon_vdupd_lane_i64((int64x1_t)__s0, __p1); \ 49382 __ret; \ 49383 }) 49384 #ifdef __LITTLE_ENDIAN__ 49385 #define vduph_lane_s16(__p0, __p1) __extension__ ({ \ 49386 int16_t __ret; \ 49387 int16x4_t __s0 = __p0; \ 49388 __ret = (int16_t) __builtin_neon_vduph_lane_i16((int16x4_t)__s0, __p1); \ 49389 __ret; \ 49390 }) 49391 #else 49392 #define vduph_lane_s16(__p0, __p1) __extension__ ({ \ 49393 int16_t __ret; \ 49394 int16x4_t __s0 = __p0; \ 49395 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 49396 __ret = (int16_t) __builtin_neon_vduph_lane_i16((int16x4_t)__rev0, __p1); \ 49397 __ret; \ 49398 }) 49399 #endif 49400 49401 #ifdef __LITTLE_ENDIAN__ 49402 #define vduph_lane_f16(__p0, __p1) __extension__ ({ \ 49403 float16_t __ret; \ 49404 
float16x4_t __s0 = __p0; \ 49405 __ret = (float16_t) __builtin_neon_vduph_lane_f16((float16x4_t)__s0, __p1); \ 49406 __ret; \ 49407 }) 49408 #else 49409 #define vduph_lane_f16(__p0, __p1) __extension__ ({ \ 49410 float16_t __ret; \ 49411 float16x4_t __s0 = __p0; \ 49412 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 49413 __ret = (float16_t) __builtin_neon_vduph_lane_f16((float16x4_t)__rev0, __p1); \ 49414 __ret; \ 49415 }) 49416 #endif 49417 49418 #define vdup_lane_p64(__p0_364, __p1_364) __extension__ ({ \ 49419 poly64x1_t __ret_364; \ 49420 poly64x1_t __s0_364 = __p0_364; \ 49421 __ret_364 = splat_lane_p64(__s0_364, __p1_364); \ 49422 __ret_364; \ 49423 }) 49424 #ifdef __LITTLE_ENDIAN__ 49425 #define vdupq_lane_p64(__p0_365, __p1_365) __extension__ ({ \ 49426 poly64x2_t __ret_365; \ 49427 poly64x1_t __s0_365 = __p0_365; \ 49428 __ret_365 = splatq_lane_p64(__s0_365, __p1_365); \ 49429 __ret_365; \ 49430 }) 49431 #else 49432 #define vdupq_lane_p64(__p0_366, __p1_366) __extension__ ({ \ 49433 poly64x2_t __ret_366; \ 49434 poly64x1_t __s0_366 = __p0_366; \ 49435 __ret_366 = __noswap_splatq_lane_p64(__s0_366, __p1_366); \ 49436 __ret_366 = __builtin_shufflevector(__ret_366, __ret_366, 1, 0); \ 49437 __ret_366; \ 49438 }) 49439 #endif 49440 49441 #ifdef __LITTLE_ENDIAN__ 49442 #define vdupq_lane_f64(__p0_367, __p1_367) __extension__ ({ \ 49443 float64x2_t __ret_367; \ 49444 float64x1_t __s0_367 = __p0_367; \ 49445 __ret_367 = splatq_lane_f64(__s0_367, __p1_367); \ 49446 __ret_367; \ 49447 }) 49448 #else 49449 #define vdupq_lane_f64(__p0_368, __p1_368) __extension__ ({ \ 49450 float64x2_t __ret_368; \ 49451 float64x1_t __s0_368 = __p0_368; \ 49452 __ret_368 = __noswap_splatq_lane_f64(__s0_368, __p1_368); \ 49453 __ret_368 = __builtin_shufflevector(__ret_368, __ret_368, 1, 0); \ 49454 __ret_368; \ 49455 }) 49456 #endif 49457 49458 #define vdup_lane_f64(__p0_369, __p1_369) __extension__ ({ \ 49459 float64x1_t __ret_369; \ 49460 
float64x1_t __s0_369 = __p0_369; \ 49461 __ret_369 = splat_lane_f64(__s0_369, __p1_369); \ 49462 __ret_369; \ 49463 }) 49464 #ifdef __LITTLE_ENDIAN__ 49465 #define vdupb_laneq_p8(__p0, __p1) __extension__ ({ \ 49466 poly8_t __ret; \ 49467 poly8x16_t __s0 = __p0; \ 49468 __ret = (poly8_t) __builtin_neon_vdupb_laneq_i8((poly8x16_t)__s0, __p1); \ 49469 __ret; \ 49470 }) 49471 #else 49472 #define vdupb_laneq_p8(__p0, __p1) __extension__ ({ \ 49473 poly8_t __ret; \ 49474 poly8x16_t __s0 = __p0; \ 49475 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49476 __ret = (poly8_t) __builtin_neon_vdupb_laneq_i8((poly8x16_t)__rev0, __p1); \ 49477 __ret; \ 49478 }) 49479 #endif 49480 49481 #ifdef __LITTLE_ENDIAN__ 49482 #define vduph_laneq_p16(__p0, __p1) __extension__ ({ \ 49483 poly16_t __ret; \ 49484 poly16x8_t __s0 = __p0; \ 49485 __ret = (poly16_t) __builtin_neon_vduph_laneq_i16((poly16x8_t)__s0, __p1); \ 49486 __ret; \ 49487 }) 49488 #else 49489 #define vduph_laneq_p16(__p0, __p1) __extension__ ({ \ 49490 poly16_t __ret; \ 49491 poly16x8_t __s0 = __p0; \ 49492 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 49493 __ret = (poly16_t) __builtin_neon_vduph_laneq_i16((poly16x8_t)__rev0, __p1); \ 49494 __ret; \ 49495 }) 49496 #endif 49497 49498 #ifdef __LITTLE_ENDIAN__ 49499 #define vdupb_laneq_u8(__p0, __p1) __extension__ ({ \ 49500 uint8_t __ret; \ 49501 uint8x16_t __s0 = __p0; \ 49502 __ret = (uint8_t) __builtin_neon_vdupb_laneq_i8((int8x16_t)__s0, __p1); \ 49503 __ret; \ 49504 }) 49505 #else 49506 #define vdupb_laneq_u8(__p0, __p1) __extension__ ({ \ 49507 uint8_t __ret; \ 49508 uint8x16_t __s0 = __p0; \ 49509 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49510 __ret = (uint8_t) __builtin_neon_vdupb_laneq_i8((int8x16_t)__rev0, __p1); \ 49511 __ret; \ 49512 }) 49513 #endif 49514 49515 
/*
 * Scalar "dup from lane" intrinsics for 128-bit source vectors.
 *
 * Each macro takes a vector __p0 and a lane index __p1 and evaluates to the
 * scalar returned by the matching __builtin_neon_vdup{b,h,s,d}_laneq_* builtin,
 * cast to the intrinsic's element type. __p0 is copied into a typed local
 * first, so it is evaluated exactly once; __p1 is forwarded to the builtin
 * unchanged.
 *
 * Little-endian builds pass the vector straight through. Big-endian builds
 * reverse its lanes with __builtin_shufflevector before the call
 * (NOTE(review): presumably so __p1 selects the same element on both byte
 * orders - confirm against the generator).
 */

/* uint32x4_t -> uint32_t; the vector is reinterpreted as int32x4_t for the builtin. */
#ifdef __LITTLE_ENDIAN__
#define vdups_laneq_u32(__p0, __p1) __extension__ ({ \
  uint32x4_t __s0 = __p0; \
  (uint32_t) __builtin_neon_vdups_laneq_i32((int32x4_t)__s0, __p1); \
})
#else
#define vdups_laneq_u32(__p0, __p1) __extension__ ({ \
  uint32x4_t __s0 = __p0; \
  uint32x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  (uint32_t) __builtin_neon_vdups_laneq_i32((int32x4_t)__rev0, __p1); \
})
#endif

/* uint64x2_t -> uint64_t; the vector is reinterpreted as int64x2_t for the builtin. */
#ifdef __LITTLE_ENDIAN__
#define vdupd_laneq_u64(__p0, __p1) __extension__ ({ \
  uint64x2_t __s0 = __p0; \
  (uint64_t) __builtin_neon_vdupd_laneq_i64((int64x2_t)__s0, __p1); \
})
#else
#define vdupd_laneq_u64(__p0, __p1) __extension__ ({ \
  uint64x2_t __s0 = __p0; \
  uint64x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  (uint64_t) __builtin_neon_vdupd_laneq_i64((int64x2_t)__rev0, __p1); \
})
#endif

/* uint16x8_t -> uint16_t; the vector is reinterpreted as int16x8_t for the builtin. */
#ifdef __LITTLE_ENDIAN__
#define vduph_laneq_u16(__p0, __p1) __extension__ ({ \
  uint16x8_t __s0 = __p0; \
  (uint16_t) __builtin_neon_vduph_laneq_i16((int16x8_t)__s0, __p1); \
})
#else
#define vduph_laneq_u16(__p0, __p1) __extension__ ({ \
  uint16x8_t __s0 = __p0; \
  uint16x8_t __rev0 = \
      __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  (uint16_t) __builtin_neon_vduph_laneq_i16((int16x8_t)__rev0, __p1); \
})
#endif

/* int8x16_t -> int8_t. */
#ifdef __LITTLE_ENDIAN__
#define vdupb_laneq_s8(__p0, __p1) __extension__ ({ \
  int8x16_t __s0 = __p0; \
  (int8_t) __builtin_neon_vdupb_laneq_i8((int8x16_t)__s0, __p1); \
})
#else
#define vdupb_laneq_s8(__p0, __p1) __extension__ ({ \
  int8x16_t __s0 = __p0; \
  int8x16_t __rev0 = \
      __builtin_shufflevector(__s0, __s0, 15, 14, 13, 12, 11, 10, 9, 8, \
                              7, 6, 5, 4, 3, 2, 1, 0); \
  (int8_t) __builtin_neon_vdupb_laneq_i8((int8x16_t)__rev0, __p1); \
})
#endif

/* float64x2_t -> float64_t. */
#ifdef __LITTLE_ENDIAN__
#define vdupd_laneq_f64(__p0, __p1) __extension__ ({ \
  float64x2_t __s0 = __p0; \
  (float64_t) __builtin_neon_vdupd_laneq_f64((float64x2_t)__s0, __p1); \
})
#else
#define vdupd_laneq_f64(__p0, __p1) __extension__ ({ \
  float64x2_t __s0 = __p0; \
  float64x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  (float64_t) __builtin_neon_vdupd_laneq_f64((float64x2_t)__rev0, __p1); \
})
#endif

/* float32x4_t -> float32_t. */
#ifdef __LITTLE_ENDIAN__
#define vdups_laneq_f32(__p0, __p1) __extension__ ({ \
  float32x4_t __s0 = __p0; \
  (float32_t) __builtin_neon_vdups_laneq_f32((float32x4_t)__s0, __p1); \
})
#else
#define vdups_laneq_f32(__p0, __p1) __extension__ ({ \
  float32x4_t __s0 = __p0; \
  float32x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  (float32_t) __builtin_neon_vdups_laneq_f32((float32x4_t)__rev0, __p1); \
})
#endif

/* int32x4_t -> int32_t. */
#ifdef __LITTLE_ENDIAN__
#define vdups_laneq_s32(__p0, __p1) __extension__ ({ \
  int32x4_t __s0 = __p0; \
  (int32_t) __builtin_neon_vdups_laneq_i32((int32x4_t)__s0, __p1); \
})
#else
#define vdups_laneq_s32(__p0, __p1) __extension__ ({ \
  int32x4_t __s0 = __p0; \
  int32x4_t __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \
  (int32_t) __builtin_neon_vdups_laneq_i32((int32x4_t)__rev0, __p1); \
})
#endif

/* int64x2_t -> int64_t. */
#ifdef __LITTLE_ENDIAN__
#define vdupd_laneq_s64(__p0, __p1) __extension__ ({ \
  int64x2_t __s0 = __p0; \
  (int64_t) __builtin_neon_vdupd_laneq_i64((int64x2_t)__s0, __p1); \
})
#else
#define vdupd_laneq_s64(__p0, __p1) __extension__ ({ \
  int64x2_t __s0 = __p0; \
  int64x2_t __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \
  (int64_t) __builtin_neon_vdupd_laneq_i64((int64x2_t)__rev0, __p1); \
})
#endif

/* int16x8_t -> int16_t. */
#ifdef __LITTLE_ENDIAN__
#define vduph_laneq_s16(__p0, __p1) __extension__ ({ \
  int16x8_t __s0 = __p0; \
  (int16_t) __builtin_neon_vduph_laneq_i16((int16x8_t)__s0, __p1); \
})
#else
#define vduph_laneq_s16(__p0, __p1) __extension__ ({ \
  int16x8_t __s0 = __p0; \
  int16x8_t __rev0 = \
      __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  (int16_t) __builtin_neon_vduph_laneq_i16((int16x8_t)__rev0, __p1); \
})
#endif

/* float16x8_t -> float16_t. */
#ifdef __LITTLE_ENDIAN__
#define vduph_laneq_f16(__p0, __p1) __extension__ ({ \
  float16x8_t __s0 = __p0; \
  (float16_t) __builtin_neon_vduph_laneq_f16((float16x8_t)__s0, __p1); \
})
#else
#define vduph_laneq_f16(__p0, __p1) __extension__ ({ \
  float16x8_t __s0 = __p0; \
  float16x8_t __rev0 = \
      __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \
  (float16_t) __builtin_neon_vduph_laneq_f16((float16x8_t)__rev0, __p1); \
})
#endif
49684 49685 #ifdef __LITTLE_ENDIAN__ 49686 #define vdup_laneq_p8(__p0_370, __p1_370) __extension__ ({ \ 49687 poly8x8_t __ret_370; \ 49688 poly8x16_t __s0_370 = __p0_370; \ 49689 __ret_370 = splat_laneq_p8(__s0_370, __p1_370); \ 49690 __ret_370; \ 49691 }) 49692 #else 49693 #define vdup_laneq_p8(__p0_371, __p1_371) __extension__ ({ \ 49694 poly8x8_t __ret_371; \ 49695 poly8x16_t __s0_371 = __p0_371; \ 49696 poly8x16_t __rev0_371; __rev0_371 = __builtin_shufflevector(__s0_371, __s0_371, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49697 __ret_371 = __noswap_splat_laneq_p8(__rev0_371, __p1_371); \ 49698 __ret_371 = __builtin_shufflevector(__ret_371, __ret_371, 7, 6, 5, 4, 3, 2, 1, 0); \ 49699 __ret_371; \ 49700 }) 49701 #endif 49702 49703 #ifdef __LITTLE_ENDIAN__ 49704 #define vdup_laneq_p64(__p0_372, __p1_372) __extension__ ({ \ 49705 poly64x1_t __ret_372; \ 49706 poly64x2_t __s0_372 = __p0_372; \ 49707 __ret_372 = splat_laneq_p64(__s0_372, __p1_372); \ 49708 __ret_372; \ 49709 }) 49710 #else 49711 #define vdup_laneq_p64(__p0_373, __p1_373) __extension__ ({ \ 49712 poly64x1_t __ret_373; \ 49713 poly64x2_t __s0_373 = __p0_373; \ 49714 poly64x2_t __rev0_373; __rev0_373 = __builtin_shufflevector(__s0_373, __s0_373, 1, 0); \ 49715 __ret_373 = __noswap_splat_laneq_p64(__rev0_373, __p1_373); \ 49716 __ret_373; \ 49717 }) 49718 #endif 49719 49720 #ifdef __LITTLE_ENDIAN__ 49721 #define vdup_laneq_p16(__p0_374, __p1_374) __extension__ ({ \ 49722 poly16x4_t __ret_374; \ 49723 poly16x8_t __s0_374 = __p0_374; \ 49724 __ret_374 = splat_laneq_p16(__s0_374, __p1_374); \ 49725 __ret_374; \ 49726 }) 49727 #else 49728 #define vdup_laneq_p16(__p0_375, __p1_375) __extension__ ({ \ 49729 poly16x4_t __ret_375; \ 49730 poly16x8_t __s0_375 = __p0_375; \ 49731 poly16x8_t __rev0_375; __rev0_375 = __builtin_shufflevector(__s0_375, __s0_375, 7, 6, 5, 4, 3, 2, 1, 0); \ 49732 __ret_375 = __noswap_splat_laneq_p16(__rev0_375, __p1_375); \ 49733 __ret_375 = 
__builtin_shufflevector(__ret_375, __ret_375, 3, 2, 1, 0); \ 49734 __ret_375; \ 49735 }) 49736 #endif 49737 49738 #ifdef __LITTLE_ENDIAN__ 49739 #define vdupq_laneq_p8(__p0_376, __p1_376) __extension__ ({ \ 49740 poly8x16_t __ret_376; \ 49741 poly8x16_t __s0_376 = __p0_376; \ 49742 __ret_376 = splatq_laneq_p8(__s0_376, __p1_376); \ 49743 __ret_376; \ 49744 }) 49745 #else 49746 #define vdupq_laneq_p8(__p0_377, __p1_377) __extension__ ({ \ 49747 poly8x16_t __ret_377; \ 49748 poly8x16_t __s0_377 = __p0_377; \ 49749 poly8x16_t __rev0_377; __rev0_377 = __builtin_shufflevector(__s0_377, __s0_377, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49750 __ret_377 = __noswap_splatq_laneq_p8(__rev0_377, __p1_377); \ 49751 __ret_377 = __builtin_shufflevector(__ret_377, __ret_377, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49752 __ret_377; \ 49753 }) 49754 #endif 49755 49756 #ifdef __LITTLE_ENDIAN__ 49757 #define vdupq_laneq_p64(__p0_378, __p1_378) __extension__ ({ \ 49758 poly64x2_t __ret_378; \ 49759 poly64x2_t __s0_378 = __p0_378; \ 49760 __ret_378 = splatq_laneq_p64(__s0_378, __p1_378); \ 49761 __ret_378; \ 49762 }) 49763 #else 49764 #define vdupq_laneq_p64(__p0_379, __p1_379) __extension__ ({ \ 49765 poly64x2_t __ret_379; \ 49766 poly64x2_t __s0_379 = __p0_379; \ 49767 poly64x2_t __rev0_379; __rev0_379 = __builtin_shufflevector(__s0_379, __s0_379, 1, 0); \ 49768 __ret_379 = __noswap_splatq_laneq_p64(__rev0_379, __p1_379); \ 49769 __ret_379 = __builtin_shufflevector(__ret_379, __ret_379, 1, 0); \ 49770 __ret_379; \ 49771 }) 49772 #endif 49773 49774 #ifdef __LITTLE_ENDIAN__ 49775 #define vdupq_laneq_p16(__p0_380, __p1_380) __extension__ ({ \ 49776 poly16x8_t __ret_380; \ 49777 poly16x8_t __s0_380 = __p0_380; \ 49778 __ret_380 = splatq_laneq_p16(__s0_380, __p1_380); \ 49779 __ret_380; \ 49780 }) 49781 #else 49782 #define vdupq_laneq_p16(__p0_381, __p1_381) __extension__ ({ \ 49783 poly16x8_t __ret_381; \ 49784 poly16x8_t __s0_381 = __p0_381; \ 49785 
poly16x8_t __rev0_381; __rev0_381 = __builtin_shufflevector(__s0_381, __s0_381, 7, 6, 5, 4, 3, 2, 1, 0); \ 49786 __ret_381 = __noswap_splatq_laneq_p16(__rev0_381, __p1_381); \ 49787 __ret_381 = __builtin_shufflevector(__ret_381, __ret_381, 7, 6, 5, 4, 3, 2, 1, 0); \ 49788 __ret_381; \ 49789 }) 49790 #endif 49791 49792 #ifdef __LITTLE_ENDIAN__ 49793 #define vdupq_laneq_u8(__p0_382, __p1_382) __extension__ ({ \ 49794 uint8x16_t __ret_382; \ 49795 uint8x16_t __s0_382 = __p0_382; \ 49796 __ret_382 = splatq_laneq_u8(__s0_382, __p1_382); \ 49797 __ret_382; \ 49798 }) 49799 #else 49800 #define vdupq_laneq_u8(__p0_383, __p1_383) __extension__ ({ \ 49801 uint8x16_t __ret_383; \ 49802 uint8x16_t __s0_383 = __p0_383; \ 49803 uint8x16_t __rev0_383; __rev0_383 = __builtin_shufflevector(__s0_383, __s0_383, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49804 __ret_383 = __noswap_splatq_laneq_u8(__rev0_383, __p1_383); \ 49805 __ret_383 = __builtin_shufflevector(__ret_383, __ret_383, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49806 __ret_383; \ 49807 }) 49808 #endif 49809 49810 #ifdef __LITTLE_ENDIAN__ 49811 #define vdupq_laneq_u32(__p0_384, __p1_384) __extension__ ({ \ 49812 uint32x4_t __ret_384; \ 49813 uint32x4_t __s0_384 = __p0_384; \ 49814 __ret_384 = splatq_laneq_u32(__s0_384, __p1_384); \ 49815 __ret_384; \ 49816 }) 49817 #else 49818 #define vdupq_laneq_u32(__p0_385, __p1_385) __extension__ ({ \ 49819 uint32x4_t __ret_385; \ 49820 uint32x4_t __s0_385 = __p0_385; \ 49821 uint32x4_t __rev0_385; __rev0_385 = __builtin_shufflevector(__s0_385, __s0_385, 3, 2, 1, 0); \ 49822 __ret_385 = __noswap_splatq_laneq_u32(__rev0_385, __p1_385); \ 49823 __ret_385 = __builtin_shufflevector(__ret_385, __ret_385, 3, 2, 1, 0); \ 49824 __ret_385; \ 49825 }) 49826 #endif 49827 49828 #ifdef __LITTLE_ENDIAN__ 49829 #define vdupq_laneq_u64(__p0_386, __p1_386) __extension__ ({ \ 49830 uint64x2_t __ret_386; \ 49831 uint64x2_t __s0_386 = __p0_386; \ 49832 __ret_386 = 
splatq_laneq_u64(__s0_386, __p1_386); \ 49833 __ret_386; \ 49834 }) 49835 #else 49836 #define vdupq_laneq_u64(__p0_387, __p1_387) __extension__ ({ \ 49837 uint64x2_t __ret_387; \ 49838 uint64x2_t __s0_387 = __p0_387; \ 49839 uint64x2_t __rev0_387; __rev0_387 = __builtin_shufflevector(__s0_387, __s0_387, 1, 0); \ 49840 __ret_387 = __noswap_splatq_laneq_u64(__rev0_387, __p1_387); \ 49841 __ret_387 = __builtin_shufflevector(__ret_387, __ret_387, 1, 0); \ 49842 __ret_387; \ 49843 }) 49844 #endif 49845 49846 #ifdef __LITTLE_ENDIAN__ 49847 #define vdupq_laneq_u16(__p0_388, __p1_388) __extension__ ({ \ 49848 uint16x8_t __ret_388; \ 49849 uint16x8_t __s0_388 = __p0_388; \ 49850 __ret_388 = splatq_laneq_u16(__s0_388, __p1_388); \ 49851 __ret_388; \ 49852 }) 49853 #else 49854 #define vdupq_laneq_u16(__p0_389, __p1_389) __extension__ ({ \ 49855 uint16x8_t __ret_389; \ 49856 uint16x8_t __s0_389 = __p0_389; \ 49857 uint16x8_t __rev0_389; __rev0_389 = __builtin_shufflevector(__s0_389, __s0_389, 7, 6, 5, 4, 3, 2, 1, 0); \ 49858 __ret_389 = __noswap_splatq_laneq_u16(__rev0_389, __p1_389); \ 49859 __ret_389 = __builtin_shufflevector(__ret_389, __ret_389, 7, 6, 5, 4, 3, 2, 1, 0); \ 49860 __ret_389; \ 49861 }) 49862 #endif 49863 49864 #ifdef __LITTLE_ENDIAN__ 49865 #define vdupq_laneq_s8(__p0_390, __p1_390) __extension__ ({ \ 49866 int8x16_t __ret_390; \ 49867 int8x16_t __s0_390 = __p0_390; \ 49868 __ret_390 = splatq_laneq_s8(__s0_390, __p1_390); \ 49869 __ret_390; \ 49870 }) 49871 #else 49872 #define vdupq_laneq_s8(__p0_391, __p1_391) __extension__ ({ \ 49873 int8x16_t __ret_391; \ 49874 int8x16_t __s0_391 = __p0_391; \ 49875 int8x16_t __rev0_391; __rev0_391 = __builtin_shufflevector(__s0_391, __s0_391, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49876 __ret_391 = __noswap_splatq_laneq_s8(__rev0_391, __p1_391); \ 49877 __ret_391 = __builtin_shufflevector(__ret_391, __ret_391, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 49878 __ret_391; \ 49879 }) 49880 
#endif 49881 49882 #ifdef __LITTLE_ENDIAN__ 49883 #define vdupq_laneq_f64(__p0_392, __p1_392) __extension__ ({ \ 49884 float64x2_t __ret_392; \ 49885 float64x2_t __s0_392 = __p0_392; \ 49886 __ret_392 = splatq_laneq_f64(__s0_392, __p1_392); \ 49887 __ret_392; \ 49888 }) 49889 #else 49890 #define vdupq_laneq_f64(__p0_393, __p1_393) __extension__ ({ \ 49891 float64x2_t __ret_393; \ 49892 float64x2_t __s0_393 = __p0_393; \ 49893 float64x2_t __rev0_393; __rev0_393 = __builtin_shufflevector(__s0_393, __s0_393, 1, 0); \ 49894 __ret_393 = __noswap_splatq_laneq_f64(__rev0_393, __p1_393); \ 49895 __ret_393 = __builtin_shufflevector(__ret_393, __ret_393, 1, 0); \ 49896 __ret_393; \ 49897 }) 49898 #endif 49899 49900 #ifdef __LITTLE_ENDIAN__ 49901 #define vdupq_laneq_f32(__p0_394, __p1_394) __extension__ ({ \ 49902 float32x4_t __ret_394; \ 49903 float32x4_t __s0_394 = __p0_394; \ 49904 __ret_394 = splatq_laneq_f32(__s0_394, __p1_394); \ 49905 __ret_394; \ 49906 }) 49907 #else 49908 #define vdupq_laneq_f32(__p0_395, __p1_395) __extension__ ({ \ 49909 float32x4_t __ret_395; \ 49910 float32x4_t __s0_395 = __p0_395; \ 49911 float32x4_t __rev0_395; __rev0_395 = __builtin_shufflevector(__s0_395, __s0_395, 3, 2, 1, 0); \ 49912 __ret_395 = __noswap_splatq_laneq_f32(__rev0_395, __p1_395); \ 49913 __ret_395 = __builtin_shufflevector(__ret_395, __ret_395, 3, 2, 1, 0); \ 49914 __ret_395; \ 49915 }) 49916 #endif 49917 49918 #ifdef __LITTLE_ENDIAN__ 49919 #define vdupq_laneq_f16(__p0_396, __p1_396) __extension__ ({ \ 49920 float16x8_t __ret_396; \ 49921 float16x8_t __s0_396 = __p0_396; \ 49922 __ret_396 = splatq_laneq_f16(__s0_396, __p1_396); \ 49923 __ret_396; \ 49924 }) 49925 #else 49926 #define vdupq_laneq_f16(__p0_397, __p1_397) __extension__ ({ \ 49927 float16x8_t __ret_397; \ 49928 float16x8_t __s0_397 = __p0_397; \ 49929 float16x8_t __rev0_397; __rev0_397 = __builtin_shufflevector(__s0_397, __s0_397, 7, 6, 5, 4, 3, 2, 1, 0); \ 49930 __ret_397 = __noswap_splatq_laneq_f16(__rev0_397, 
__p1_397); \ 49931 __ret_397 = __builtin_shufflevector(__ret_397, __ret_397, 7, 6, 5, 4, 3, 2, 1, 0); \ 49932 __ret_397; \ 49933 }) 49934 #endif 49935 49936 #ifdef __LITTLE_ENDIAN__ 49937 #define vdupq_laneq_s32(__p0_398, __p1_398) __extension__ ({ \ 49938 int32x4_t __ret_398; \ 49939 int32x4_t __s0_398 = __p0_398; \ 49940 __ret_398 = splatq_laneq_s32(__s0_398, __p1_398); \ 49941 __ret_398; \ 49942 }) 49943 #else 49944 #define vdupq_laneq_s32(__p0_399, __p1_399) __extension__ ({ \ 49945 int32x4_t __ret_399; \ 49946 int32x4_t __s0_399 = __p0_399; \ 49947 int32x4_t __rev0_399; __rev0_399 = __builtin_shufflevector(__s0_399, __s0_399, 3, 2, 1, 0); \ 49948 __ret_399 = __noswap_splatq_laneq_s32(__rev0_399, __p1_399); \ 49949 __ret_399 = __builtin_shufflevector(__ret_399, __ret_399, 3, 2, 1, 0); \ 49950 __ret_399; \ 49951 }) 49952 #endif 49953 49954 #ifdef __LITTLE_ENDIAN__ 49955 #define vdupq_laneq_s64(__p0_400, __p1_400) __extension__ ({ \ 49956 int64x2_t __ret_400; \ 49957 int64x2_t __s0_400 = __p0_400; \ 49958 __ret_400 = splatq_laneq_s64(__s0_400, __p1_400); \ 49959 __ret_400; \ 49960 }) 49961 #else 49962 #define vdupq_laneq_s64(__p0_401, __p1_401) __extension__ ({ \ 49963 int64x2_t __ret_401; \ 49964 int64x2_t __s0_401 = __p0_401; \ 49965 int64x2_t __rev0_401; __rev0_401 = __builtin_shufflevector(__s0_401, __s0_401, 1, 0); \ 49966 __ret_401 = __noswap_splatq_laneq_s64(__rev0_401, __p1_401); \ 49967 __ret_401 = __builtin_shufflevector(__ret_401, __ret_401, 1, 0); \ 49968 __ret_401; \ 49969 }) 49970 #endif 49971 49972 #ifdef __LITTLE_ENDIAN__ 49973 #define vdupq_laneq_s16(__p0_402, __p1_402) __extension__ ({ \ 49974 int16x8_t __ret_402; \ 49975 int16x8_t __s0_402 = __p0_402; \ 49976 __ret_402 = splatq_laneq_s16(__s0_402, __p1_402); \ 49977 __ret_402; \ 49978 }) 49979 #else 49980 #define vdupq_laneq_s16(__p0_403, __p1_403) __extension__ ({ \ 49981 int16x8_t __ret_403; \ 49982 int16x8_t __s0_403 = __p0_403; \ 49983 int16x8_t __rev0_403; __rev0_403 = 
__builtin_shufflevector(__s0_403, __s0_403, 7, 6, 5, 4, 3, 2, 1, 0); \ 49984 __ret_403 = __noswap_splatq_laneq_s16(__rev0_403, __p1_403); \ 49985 __ret_403 = __builtin_shufflevector(__ret_403, __ret_403, 7, 6, 5, 4, 3, 2, 1, 0); \ 49986 __ret_403; \ 49987 }) 49988 #endif 49989 49990 #ifdef __LITTLE_ENDIAN__ 49991 #define vdup_laneq_u8(__p0_404, __p1_404) __extension__ ({ \ 49992 uint8x8_t __ret_404; \ 49993 uint8x16_t __s0_404 = __p0_404; \ 49994 __ret_404 = splat_laneq_u8(__s0_404, __p1_404); \ 49995 __ret_404; \ 49996 }) 49997 #else 49998 #define vdup_laneq_u8(__p0_405, __p1_405) __extension__ ({ \ 49999 uint8x8_t __ret_405; \ 50000 uint8x16_t __s0_405 = __p0_405; \ 50001 uint8x16_t __rev0_405; __rev0_405 = __builtin_shufflevector(__s0_405, __s0_405, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 50002 __ret_405 = __noswap_splat_laneq_u8(__rev0_405, __p1_405); \ 50003 __ret_405 = __builtin_shufflevector(__ret_405, __ret_405, 7, 6, 5, 4, 3, 2, 1, 0); \ 50004 __ret_405; \ 50005 }) 50006 #endif 50007 50008 #ifdef __LITTLE_ENDIAN__ 50009 #define vdup_laneq_u32(__p0_406, __p1_406) __extension__ ({ \ 50010 uint32x2_t __ret_406; \ 50011 uint32x4_t __s0_406 = __p0_406; \ 50012 __ret_406 = splat_laneq_u32(__s0_406, __p1_406); \ 50013 __ret_406; \ 50014 }) 50015 #else 50016 #define vdup_laneq_u32(__p0_407, __p1_407) __extension__ ({ \ 50017 uint32x2_t __ret_407; \ 50018 uint32x4_t __s0_407 = __p0_407; \ 50019 uint32x4_t __rev0_407; __rev0_407 = __builtin_shufflevector(__s0_407, __s0_407, 3, 2, 1, 0); \ 50020 __ret_407 = __noswap_splat_laneq_u32(__rev0_407, __p1_407); \ 50021 __ret_407 = __builtin_shufflevector(__ret_407, __ret_407, 1, 0); \ 50022 __ret_407; \ 50023 }) 50024 #endif 50025 50026 #ifdef __LITTLE_ENDIAN__ 50027 #define vdup_laneq_u64(__p0_408, __p1_408) __extension__ ({ \ 50028 uint64x1_t __ret_408; \ 50029 uint64x2_t __s0_408 = __p0_408; \ 50030 __ret_408 = splat_laneq_u64(__s0_408, __p1_408); \ 50031 __ret_408; \ 50032 }) 50033 #else 50034 #define 
vdup_laneq_u64(__p0_409, __p1_409) __extension__ ({ \ 50035 uint64x1_t __ret_409; \ 50036 uint64x2_t __s0_409 = __p0_409; \ 50037 uint64x2_t __rev0_409; __rev0_409 = __builtin_shufflevector(__s0_409, __s0_409, 1, 0); \ 50038 __ret_409 = __noswap_splat_laneq_u64(__rev0_409, __p1_409); \ 50039 __ret_409; \ 50040 }) 50041 #endif 50042 50043 #ifdef __LITTLE_ENDIAN__ 50044 #define vdup_laneq_u16(__p0_410, __p1_410) __extension__ ({ \ 50045 uint16x4_t __ret_410; \ 50046 uint16x8_t __s0_410 = __p0_410; \ 50047 __ret_410 = splat_laneq_u16(__s0_410, __p1_410); \ 50048 __ret_410; \ 50049 }) 50050 #else 50051 #define vdup_laneq_u16(__p0_411, __p1_411) __extension__ ({ \ 50052 uint16x4_t __ret_411; \ 50053 uint16x8_t __s0_411 = __p0_411; \ 50054 uint16x8_t __rev0_411; __rev0_411 = __builtin_shufflevector(__s0_411, __s0_411, 7, 6, 5, 4, 3, 2, 1, 0); \ 50055 __ret_411 = __noswap_splat_laneq_u16(__rev0_411, __p1_411); \ 50056 __ret_411 = __builtin_shufflevector(__ret_411, __ret_411, 3, 2, 1, 0); \ 50057 __ret_411; \ 50058 }) 50059 #endif 50060 50061 #ifdef __LITTLE_ENDIAN__ 50062 #define vdup_laneq_s8(__p0_412, __p1_412) __extension__ ({ \ 50063 int8x8_t __ret_412; \ 50064 int8x16_t __s0_412 = __p0_412; \ 50065 __ret_412 = splat_laneq_s8(__s0_412, __p1_412); \ 50066 __ret_412; \ 50067 }) 50068 #else 50069 #define vdup_laneq_s8(__p0_413, __p1_413) __extension__ ({ \ 50070 int8x8_t __ret_413; \ 50071 int8x16_t __s0_413 = __p0_413; \ 50072 int8x16_t __rev0_413; __rev0_413 = __builtin_shufflevector(__s0_413, __s0_413, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 50073 __ret_413 = __noswap_splat_laneq_s8(__rev0_413, __p1_413); \ 50074 __ret_413 = __builtin_shufflevector(__ret_413, __ret_413, 7, 6, 5, 4, 3, 2, 1, 0); \ 50075 __ret_413; \ 50076 }) 50077 #endif 50078 50079 #ifdef __LITTLE_ENDIAN__ 50080 #define vdup_laneq_f64(__p0_414, __p1_414) __extension__ ({ \ 50081 float64x1_t __ret_414; \ 50082 float64x2_t __s0_414 = __p0_414; \ 50083 __ret_414 = 
splat_laneq_f64(__s0_414, __p1_414); \ 50084 __ret_414; \ 50085 }) 50086 #else 50087 #define vdup_laneq_f64(__p0_415, __p1_415) __extension__ ({ \ 50088 float64x1_t __ret_415; \ 50089 float64x2_t __s0_415 = __p0_415; \ 50090 float64x2_t __rev0_415; __rev0_415 = __builtin_shufflevector(__s0_415, __s0_415, 1, 0); \ 50091 __ret_415 = __noswap_splat_laneq_f64(__rev0_415, __p1_415); \ 50092 __ret_415; \ 50093 }) 50094 #endif 50095 50096 #ifdef __LITTLE_ENDIAN__ 50097 #define vdup_laneq_f32(__p0_416, __p1_416) __extension__ ({ \ 50098 float32x2_t __ret_416; \ 50099 float32x4_t __s0_416 = __p0_416; \ 50100 __ret_416 = splat_laneq_f32(__s0_416, __p1_416); \ 50101 __ret_416; \ 50102 }) 50103 #else 50104 #define vdup_laneq_f32(__p0_417, __p1_417) __extension__ ({ \ 50105 float32x2_t __ret_417; \ 50106 float32x4_t __s0_417 = __p0_417; \ 50107 float32x4_t __rev0_417; __rev0_417 = __builtin_shufflevector(__s0_417, __s0_417, 3, 2, 1, 0); \ 50108 __ret_417 = __noswap_splat_laneq_f32(__rev0_417, __p1_417); \ 50109 __ret_417 = __builtin_shufflevector(__ret_417, __ret_417, 1, 0); \ 50110 __ret_417; \ 50111 }) 50112 #endif 50113 50114 #ifdef __LITTLE_ENDIAN__ 50115 #define vdup_laneq_f16(__p0_418, __p1_418) __extension__ ({ \ 50116 float16x4_t __ret_418; \ 50117 float16x8_t __s0_418 = __p0_418; \ 50118 __ret_418 = splat_laneq_f16(__s0_418, __p1_418); \ 50119 __ret_418; \ 50120 }) 50121 #else 50122 #define vdup_laneq_f16(__p0_419, __p1_419) __extension__ ({ \ 50123 float16x4_t __ret_419; \ 50124 float16x8_t __s0_419 = __p0_419; \ 50125 float16x8_t __rev0_419; __rev0_419 = __builtin_shufflevector(__s0_419, __s0_419, 7, 6, 5, 4, 3, 2, 1, 0); \ 50126 __ret_419 = __noswap_splat_laneq_f16(__rev0_419, __p1_419); \ 50127 __ret_419 = __builtin_shufflevector(__ret_419, __ret_419, 3, 2, 1, 0); \ 50128 __ret_419; \ 50129 }) 50130 #endif 50131 50132 #ifdef __LITTLE_ENDIAN__ 50133 #define vdup_laneq_s32(__p0_420, __p1_420) __extension__ ({ \ 50134 int32x2_t __ret_420; \ 50135 int32x4_t __s0_420 = 
__p0_420; \ 50136 __ret_420 = splat_laneq_s32(__s0_420, __p1_420); \ 50137 __ret_420; \ 50138 }) 50139 #else 50140 #define vdup_laneq_s32(__p0_421, __p1_421) __extension__ ({ \ 50141 int32x2_t __ret_421; \ 50142 int32x4_t __s0_421 = __p0_421; \ 50143 int32x4_t __rev0_421; __rev0_421 = __builtin_shufflevector(__s0_421, __s0_421, 3, 2, 1, 0); \ 50144 __ret_421 = __noswap_splat_laneq_s32(__rev0_421, __p1_421); \ 50145 __ret_421 = __builtin_shufflevector(__ret_421, __ret_421, 1, 0); \ 50146 __ret_421; \ 50147 }) 50148 #endif 50149 50150 #ifdef __LITTLE_ENDIAN__ 50151 #define vdup_laneq_s64(__p0_422, __p1_422) __extension__ ({ \ 50152 int64x1_t __ret_422; \ 50153 int64x2_t __s0_422 = __p0_422; \ 50154 __ret_422 = splat_laneq_s64(__s0_422, __p1_422); \ 50155 __ret_422; \ 50156 }) 50157 #else 50158 #define vdup_laneq_s64(__p0_423, __p1_423) __extension__ ({ \ 50159 int64x1_t __ret_423; \ 50160 int64x2_t __s0_423 = __p0_423; \ 50161 int64x2_t __rev0_423; __rev0_423 = __builtin_shufflevector(__s0_423, __s0_423, 1, 0); \ 50162 __ret_423 = __noswap_splat_laneq_s64(__rev0_423, __p1_423); \ 50163 __ret_423; \ 50164 }) 50165 #endif 50166 50167 #ifdef __LITTLE_ENDIAN__ 50168 #define vdup_laneq_s16(__p0_424, __p1_424) __extension__ ({ \ 50169 int16x4_t __ret_424; \ 50170 int16x8_t __s0_424 = __p0_424; \ 50171 __ret_424 = splat_laneq_s16(__s0_424, __p1_424); \ 50172 __ret_424; \ 50173 }) 50174 #else 50175 #define vdup_laneq_s16(__p0_425, __p1_425) __extension__ ({ \ 50176 int16x4_t __ret_425; \ 50177 int16x8_t __s0_425 = __p0_425; \ 50178 int16x8_t __rev0_425; __rev0_425 = __builtin_shufflevector(__s0_425, __s0_425, 7, 6, 5, 4, 3, 2, 1, 0); \ 50179 __ret_425 = __noswap_splat_laneq_s16(__rev0_425, __p1_425); \ 50180 __ret_425 = __builtin_shufflevector(__ret_425, __ret_425, 3, 2, 1, 0); \ 50181 __ret_425; \ 50182 }) 50183 #endif 50184 50185 __ai __attribute__((target("neon"))) poly64x1_t vdup_n_p64(poly64_t __p0) { 50186 poly64x1_t __ret; 50187 __ret = (poly64x1_t) {__p0}; 50188 
return __ret; 50189 } 50190 #ifdef __LITTLE_ENDIAN__ 50191 __ai __attribute__((target("neon"))) poly64x2_t vdupq_n_p64(poly64_t __p0) { 50192 poly64x2_t __ret; 50193 __ret = (poly64x2_t) {__p0, __p0}; 50194 return __ret; 50195 } 50196 #else 50197 __ai __attribute__((target("neon"))) poly64x2_t vdupq_n_p64(poly64_t __p0) { 50198 poly64x2_t __ret; 50199 __ret = (poly64x2_t) {__p0, __p0}; 50200 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 50201 return __ret; 50202 } 50203 #endif 50204 50205 #ifdef __LITTLE_ENDIAN__ 50206 __ai __attribute__((target("neon"))) float64x2_t vdupq_n_f64(float64_t __p0) { 50207 float64x2_t __ret; 50208 __ret = (float64x2_t) {__p0, __p0}; 50209 return __ret; 50210 } 50211 #else 50212 __ai __attribute__((target("neon"))) float64x2_t vdupq_n_f64(float64_t __p0) { 50213 float64x2_t __ret; 50214 __ret = (float64x2_t) {__p0, __p0}; 50215 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 50216 return __ret; 50217 } 50218 #endif 50219 50220 __ai __attribute__((target("neon"))) float64x1_t vdup_n_f64(float64_t __p0) { 50221 float64x1_t __ret; 50222 __ret = (float64x1_t) {__p0}; 50223 return __ret; 50224 } 50225 #define vext_p64(__p0, __p1, __p2) __extension__ ({ \ 50226 poly64x1_t __ret; \ 50227 poly64x1_t __s0 = __p0; \ 50228 poly64x1_t __s1 = __p1; \ 50229 __ret = (poly64x1_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 6); \ 50230 __ret; \ 50231 }) 50232 #ifdef __LITTLE_ENDIAN__ 50233 #define vextq_p64(__p0, __p1, __p2) __extension__ ({ \ 50234 poly64x2_t __ret; \ 50235 poly64x2_t __s0 = __p0; \ 50236 poly64x2_t __s1 = __p1; \ 50237 __ret = (poly64x2_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 38); \ 50238 __ret; \ 50239 }) 50240 #else 50241 #define vextq_p64(__p0, __p1, __p2) __extension__ ({ \ 50242 poly64x2_t __ret; \ 50243 poly64x2_t __s0 = __p0; \ 50244 poly64x2_t __s1 = __p1; \ 50245 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 50246 poly64x2_t __rev1; __rev1 = 
__builtin_shufflevector(__s1, __s1, 1, 0); \ 50247 __ret = (poly64x2_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 38); \ 50248 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 50249 __ret; \ 50250 }) 50251 #endif 50252 50253 #ifdef __LITTLE_ENDIAN__ 50254 #define vextq_f64(__p0, __p1, __p2) __extension__ ({ \ 50255 float64x2_t __ret; \ 50256 float64x2_t __s0 = __p0; \ 50257 float64x2_t __s1 = __p1; \ 50258 __ret = (float64x2_t) __builtin_neon_vextq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 42); \ 50259 __ret; \ 50260 }) 50261 #else 50262 #define vextq_f64(__p0, __p1, __p2) __extension__ ({ \ 50263 float64x2_t __ret; \ 50264 float64x2_t __s0 = __p0; \ 50265 float64x2_t __s1 = __p1; \ 50266 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 50267 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 50268 __ret = (float64x2_t) __builtin_neon_vextq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 42); \ 50269 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 50270 __ret; \ 50271 }) 50272 #endif 50273 50274 #define vext_f64(__p0, __p1, __p2) __extension__ ({ \ 50275 float64x1_t __ret; \ 50276 float64x1_t __s0 = __p0; \ 50277 float64x1_t __s1 = __p1; \ 50278 __ret = (float64x1_t) __builtin_neon_vext_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 10); \ 50279 __ret; \ 50280 }) 50281 #ifdef __LITTLE_ENDIAN__ 50282 __ai __attribute__((target("neon"))) float64x2_t vfmaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 50283 float64x2_t __ret; 50284 __ret = (float64x2_t) __builtin_neon_vfmaq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42); 50285 return __ret; 50286 } 50287 #else 50288 __ai __attribute__((target("neon"))) float64x2_t vfmaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 50289 float64x2_t __ret; 50290 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 50291 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 50292 
float64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 50293 __ret = (float64x2_t) __builtin_neon_vfmaq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42); 50294 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 50295 return __ret; 50296 } 50297 __ai __attribute__((target("neon"))) float64x2_t __noswap_vfmaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 50298 float64x2_t __ret; 50299 __ret = (float64x2_t) __builtin_neon_vfmaq_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42); 50300 return __ret; 50301 } 50302 #endif 50303 50304 __ai __attribute__((target("neon"))) float64x1_t vfma_f64(float64x1_t __p0, float64x1_t __p1, float64x1_t __p2) { 50305 float64x1_t __ret; 50306 __ret = (float64x1_t) __builtin_neon_vfma_v((int8x8_t)__p0, (int8x8_t)__p1, (int8x8_t)__p2, 10); 50307 return __ret; 50308 } 50309 #define vfmad_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50310 float64_t __ret; \ 50311 float64_t __s0 = __p0; \ 50312 float64_t __s1 = __p1; \ 50313 float64x1_t __s2 = __p2; \ 50314 __ret = (float64_t) __builtin_neon_vfmad_lane_f64(__s0, __s1, (float64x1_t)__s2, __p3); \ 50315 __ret; \ 50316 }) 50317 #ifdef __LITTLE_ENDIAN__ 50318 #define vfmas_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50319 float32_t __ret; \ 50320 float32_t __s0 = __p0; \ 50321 float32_t __s1 = __p1; \ 50322 float32x2_t __s2 = __p2; \ 50323 __ret = (float32_t) __builtin_neon_vfmas_lane_f32(__s0, __s1, (float32x2_t)__s2, __p3); \ 50324 __ret; \ 50325 }) 50326 #else 50327 #define vfmas_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50328 float32_t __ret; \ 50329 float32_t __s0 = __p0; \ 50330 float32_t __s1 = __p1; \ 50331 float32x2_t __s2 = __p2; \ 50332 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \ 50333 __ret = (float32_t) __builtin_neon_vfmas_lane_f32(__s0, __s1, (float32x2_t)__rev2, __p3); \ 50334 __ret; \ 50335 }) 50336 #define __noswap_vfmas_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 
50337 float32_t __ret; \ 50338 float32_t __s0 = __p0; \ 50339 float32_t __s1 = __p1; \ 50340 float32x2_t __s2 = __p2; \ 50341 __ret = (float32_t) __builtin_neon_vfmas_lane_f32(__s0, __s1, (float32x2_t)__s2, __p3); \ 50342 __ret; \ 50343 }) 50344 #endif 50345 50346 #ifdef __LITTLE_ENDIAN__ 50347 #define vfmaq_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50348 float64x2_t __ret; \ 50349 float64x2_t __s0 = __p0; \ 50350 float64x2_t __s1 = __p1; \ 50351 float64x1_t __s2 = __p2; \ 50352 __ret = (float64x2_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 42); \ 50353 __ret; \ 50354 }) 50355 #else 50356 #define vfmaq_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50357 float64x2_t __ret; \ 50358 float64x2_t __s0 = __p0; \ 50359 float64x2_t __s1 = __p1; \ 50360 float64x1_t __s2 = __p2; \ 50361 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 50362 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 50363 __ret = (float64x2_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__s2, __p3, 42); \ 50364 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 50365 __ret; \ 50366 }) 50367 #define __noswap_vfmaq_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50368 float64x2_t __ret; \ 50369 float64x2_t __s0 = __p0; \ 50370 float64x2_t __s1 = __p1; \ 50371 float64x1_t __s2 = __p2; \ 50372 __ret = (float64x2_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 42); \ 50373 __ret; \ 50374 }) 50375 #endif 50376 50377 #ifdef __LITTLE_ENDIAN__ 50378 #define vfmaq_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50379 float32x4_t __ret; \ 50380 float32x4_t __s0 = __p0; \ 50381 float32x4_t __s1 = __p1; \ 50382 float32x2_t __s2 = __p2; \ 50383 __ret = (float32x4_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 41); \ 50384 __ret; \ 50385 }) 50386 #else 50387 #define vfmaq_lane_f32(__p0, 
__p1, __p2, __p3) __extension__ ({ \ 50388 float32x4_t __ret; \ 50389 float32x4_t __s0 = __p0; \ 50390 float32x4_t __s1 = __p1; \ 50391 float32x2_t __s2 = __p2; \ 50392 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 50393 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 50394 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \ 50395 __ret = (float32x4_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, __p3, 41); \ 50396 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 50397 __ret; \ 50398 }) 50399 #define __noswap_vfmaq_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50400 float32x4_t __ret; \ 50401 float32x4_t __s0 = __p0; \ 50402 float32x4_t __s1 = __p1; \ 50403 float32x2_t __s2 = __p2; \ 50404 __ret = (float32x4_t) __builtin_neon_vfmaq_lane_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x8_t)__s2, __p3, 41); \ 50405 __ret; \ 50406 }) 50407 #endif 50408 50409 #define vfma_lane_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50410 float64x1_t __ret; \ 50411 float64x1_t __s0 = __p0; \ 50412 float64x1_t __s1 = __p1; \ 50413 float64x1_t __s2 = __p2; \ 50414 __ret = (float64x1_t) __builtin_neon_vfma_lane_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 10); \ 50415 __ret; \ 50416 }) 50417 #ifdef __LITTLE_ENDIAN__ 50418 #define vfma_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50419 float32x2_t __ret; \ 50420 float32x2_t __s0 = __p0; \ 50421 float32x2_t __s1 = __p1; \ 50422 float32x2_t __s2 = __p2; \ 50423 __ret = (float32x2_t) __builtin_neon_vfma_lane_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 9); \ 50424 __ret; \ 50425 }) 50426 #else 50427 #define vfma_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50428 float32x2_t __ret; \ 50429 float32x2_t __s0 = __p0; \ 50430 float32x2_t __s1 = __p1; \ 50431 float32x2_t __s2 = __p2; \ 50432 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 50433 
float32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 50434 float32x2_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \ 50435 __ret = (float32x2_t) __builtin_neon_vfma_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x8_t)__rev2, __p3, 9); \ 50436 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 50437 __ret; \ 50438 }) 50439 #define __noswap_vfma_lane_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50440 float32x2_t __ret; \ 50441 float32x2_t __s0 = __p0; \ 50442 float32x2_t __s1 = __p1; \ 50443 float32x2_t __s2 = __p2; \ 50444 __ret = (float32x2_t) __builtin_neon_vfma_lane_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x8_t)__s2, __p3, 9); \ 50445 __ret; \ 50446 }) 50447 #endif 50448 50449 #ifdef __LITTLE_ENDIAN__ 50450 #define vfmad_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50451 float64_t __ret; \ 50452 float64_t __s0 = __p0; \ 50453 float64_t __s1 = __p1; \ 50454 float64x2_t __s2 = __p2; \ 50455 __ret = (float64_t) __builtin_neon_vfmad_laneq_f64(__s0, __s1, (float64x2_t)__s2, __p3); \ 50456 __ret; \ 50457 }) 50458 #else 50459 #define vfmad_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50460 float64_t __ret; \ 50461 float64_t __s0 = __p0; \ 50462 float64_t __s1 = __p1; \ 50463 float64x2_t __s2 = __p2; \ 50464 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \ 50465 __ret = (float64_t) __builtin_neon_vfmad_laneq_f64(__s0, __s1, (float64x2_t)__rev2, __p3); \ 50466 __ret; \ 50467 }) 50468 #define __noswap_vfmad_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50469 float64_t __ret; \ 50470 float64_t __s0 = __p0; \ 50471 float64_t __s1 = __p1; \ 50472 float64x2_t __s2 = __p2; \ 50473 __ret = (float64_t) __builtin_neon_vfmad_laneq_f64(__s0, __s1, (float64x2_t)__s2, __p3); \ 50474 __ret; \ 50475 }) 50476 #endif 50477 50478 #ifdef __LITTLE_ENDIAN__ 50479 #define vfmas_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50480 float32_t __ret; \ 50481 float32_t __s0 = __p0; \ 50482 float32_t __s1 
= __p1; \ 50483 float32x4_t __s2 = __p2; \ 50484 __ret = (float32_t) __builtin_neon_vfmas_laneq_f32(__s0, __s1, (float32x4_t)__s2, __p3); \ 50485 __ret; \ 50486 }) 50487 #else 50488 #define vfmas_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50489 float32_t __ret; \ 50490 float32_t __s0 = __p0; \ 50491 float32_t __s1 = __p1; \ 50492 float32x4_t __s2 = __p2; \ 50493 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 50494 __ret = (float32_t) __builtin_neon_vfmas_laneq_f32(__s0, __s1, (float32x4_t)__rev2, __p3); \ 50495 __ret; \ 50496 }) 50497 #define __noswap_vfmas_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50498 float32_t __ret; \ 50499 float32_t __s0 = __p0; \ 50500 float32_t __s1 = __p1; \ 50501 float32x4_t __s2 = __p2; \ 50502 __ret = (float32_t) __builtin_neon_vfmas_laneq_f32(__s0, __s1, (float32x4_t)__s2, __p3); \ 50503 __ret; \ 50504 }) 50505 #endif 50506 50507 #ifdef __LITTLE_ENDIAN__ 50508 #define vfmaq_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50509 float64x2_t __ret; \ 50510 float64x2_t __s0 = __p0; \ 50511 float64x2_t __s1 = __p1; \ 50512 float64x2_t __s2 = __p2; \ 50513 __ret = (float64x2_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 42); \ 50514 __ret; \ 50515 }) 50516 #else 50517 #define vfmaq_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50518 float64x2_t __ret; \ 50519 float64x2_t __s0 = __p0; \ 50520 float64x2_t __s1 = __p1; \ 50521 float64x2_t __s2 = __p2; \ 50522 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 50523 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 50524 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \ 50525 __ret = (float64x2_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 42); \ 50526 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 50527 __ret; \ 50528 }) 50529 #define 
__noswap_vfmaq_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50530 float64x2_t __ret; \ 50531 float64x2_t __s0 = __p0; \ 50532 float64x2_t __s1 = __p1; \ 50533 float64x2_t __s2 = __p2; \ 50534 __ret = (float64x2_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 42); \ 50535 __ret; \ 50536 }) 50537 #endif 50538 50539 #ifdef __LITTLE_ENDIAN__ 50540 #define vfmaq_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50541 float32x4_t __ret; \ 50542 float32x4_t __s0 = __p0; \ 50543 float32x4_t __s1 = __p1; \ 50544 float32x4_t __s2 = __p2; \ 50545 __ret = (float32x4_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 41); \ 50546 __ret; \ 50547 }) 50548 #else 50549 #define vfmaq_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50550 float32x4_t __ret; \ 50551 float32x4_t __s0 = __p0; \ 50552 float32x4_t __s1 = __p1; \ 50553 float32x4_t __s2 = __p2; \ 50554 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 50555 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 50556 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 50557 __ret = (float32x4_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 41); \ 50558 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 50559 __ret; \ 50560 }) 50561 #define __noswap_vfmaq_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50562 float32x4_t __ret; \ 50563 float32x4_t __s0 = __p0; \ 50564 float32x4_t __s1 = __p1; \ 50565 float32x4_t __s2 = __p2; \ 50566 __ret = (float32x4_t) __builtin_neon_vfmaq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 41); \ 50567 __ret; \ 50568 }) 50569 #endif 50570 50571 #ifdef __LITTLE_ENDIAN__ 50572 #define vfma_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50573 float64x1_t __ret; \ 50574 float64x1_t __s0 = __p0; \ 50575 float64x1_t __s1 = __p1; \ 50576 
float64x2_t __s2 = __p2; \ 50577 __ret = (float64x1_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 10); \ 50578 __ret; \ 50579 }) 50580 #else 50581 #define vfma_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50582 float64x1_t __ret; \ 50583 float64x1_t __s0 = __p0; \ 50584 float64x1_t __s1 = __p1; \ 50585 float64x2_t __s2 = __p2; \ 50586 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \ 50587 __ret = (float64x1_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__rev2, __p3, 10); \ 50588 __ret; \ 50589 }) 50590 #define __noswap_vfma_laneq_f64(__p0, __p1, __p2, __p3) __extension__ ({ \ 50591 float64x1_t __ret; \ 50592 float64x1_t __s0 = __p0; \ 50593 float64x1_t __s1 = __p1; \ 50594 float64x2_t __s2 = __p2; \ 50595 __ret = (float64x1_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 10); \ 50596 __ret; \ 50597 }) 50598 #endif 50599 50600 #ifdef __LITTLE_ENDIAN__ 50601 #define vfma_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50602 float32x2_t __ret; \ 50603 float32x2_t __s0 = __p0; \ 50604 float32x2_t __s1 = __p1; \ 50605 float32x4_t __s2 = __p2; \ 50606 __ret = (float32x2_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 9); \ 50607 __ret; \ 50608 }) 50609 #else 50610 #define vfma_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50611 float32x2_t __ret; \ 50612 float32x2_t __s0 = __p0; \ 50613 float32x2_t __s1 = __p1; \ 50614 float32x4_t __s2 = __p2; \ 50615 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 50616 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 50617 float32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 50618 __ret = (float32x2_t) __builtin_neon_vfma_laneq_v((int8x8_t)__rev0, (int8x8_t)__rev1, (int8x16_t)__rev2, __p3, 9); \ 50619 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 50620 __ret; \ 
50621 }) 50622 #define __noswap_vfma_laneq_f32(__p0, __p1, __p2, __p3) __extension__ ({ \ 50623 float32x2_t __ret; \ 50624 float32x2_t __s0 = __p0; \ 50625 float32x2_t __s1 = __p1; \ 50626 float32x4_t __s2 = __p2; \ 50627 __ret = (float32x2_t) __builtin_neon_vfma_laneq_v((int8x8_t)__s0, (int8x8_t)__s1, (int8x16_t)__s2, __p3, 9); \ 50628 __ret; \ 50629 }) 50630 #endif 50631 50632 #ifdef __LITTLE_ENDIAN__ 50633 __ai __attribute__((target("neon"))) float64x2_t vfmaq_n_f64(float64x2_t __p0, float64x2_t __p1, float64_t __p2) { 50634 float64x2_t __ret; 50635 __ret = vfmaq_f64(__p0, __p1, (float64x2_t) {__p2, __p2}); 50636 return __ret; 50637 } 50638 #else 50639 __ai __attribute__((target("neon"))) float64x2_t vfmaq_n_f64(float64x2_t __p0, float64x2_t __p1, float64_t __p2) { 50640 float64x2_t __ret; 50641 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 50642 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 50643 __ret = __noswap_vfmaq_f64(__rev0, __rev1, (float64x2_t) {__p2, __p2}); 50644 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 50645 return __ret; 50646 } 50647 #endif 50648 50649 __ai __attribute__((target("neon"))) float64x1_t vfma_n_f64(float64x1_t __p0, float64x1_t __p1, float64_t __p2) { 50650 float64x1_t __ret; 50651 __ret = vfma_f64(__p0, __p1, (float64x1_t) {__p2}); 50652 return __ret; 50653 } 50654 #ifdef __LITTLE_ENDIAN__ 50655 __ai __attribute__((target("neon"))) float64x2_t vfmsq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 50656 float64x2_t __ret; 50657 __ret = vfmaq_f64(__p0, -__p1, __p2); 50658 return __ret; 50659 } 50660 #else 50661 __ai __attribute__((target("neon"))) float64x2_t vfmsq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 50662 float64x2_t __ret; 50663 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 50664 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 50665 float64x2_t __rev2; __rev2 = 
__builtin_shufflevector(__p2, __p2, 1, 0); 50666 __ret = __noswap_vfmaq_f64(__rev0, -__rev1, __rev2); 50667 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 50668 return __ret; 50669 } 50670 #endif 50671 50672 __ai __attribute__((target("neon"))) float64x1_t vfms_f64(float64x1_t __p0, float64x1_t __p1, float64x1_t __p2) { 50673 float64x1_t __ret; 50674 __ret = vfma_f64(__p0, -__p1, __p2); 50675 return __ret; 50676 } 50677 #define vfmsd_lane_f64(__p0_426, __p1_426, __p2_426, __p3_426) __extension__ ({ \ 50678 float64_t __ret_426; \ 50679 float64_t __s0_426 = __p0_426; \ 50680 float64_t __s1_426 = __p1_426; \ 50681 float64x1_t __s2_426 = __p2_426; \ 50682 __ret_426 = vfmad_lane_f64(__s0_426, -__s1_426, __s2_426, __p3_426); \ 50683 __ret_426; \ 50684 }) 50685 #ifdef __LITTLE_ENDIAN__ 50686 #define vfmss_lane_f32(__p0_427, __p1_427, __p2_427, __p3_427) __extension__ ({ \ 50687 float32_t __ret_427; \ 50688 float32_t __s0_427 = __p0_427; \ 50689 float32_t __s1_427 = __p1_427; \ 50690 float32x2_t __s2_427 = __p2_427; \ 50691 __ret_427 = vfmas_lane_f32(__s0_427, -__s1_427, __s2_427, __p3_427); \ 50692 __ret_427; \ 50693 }) 50694 #else 50695 #define vfmss_lane_f32(__p0_428, __p1_428, __p2_428, __p3_428) __extension__ ({ \ 50696 float32_t __ret_428; \ 50697 float32_t __s0_428 = __p0_428; \ 50698 float32_t __s1_428 = __p1_428; \ 50699 float32x2_t __s2_428 = __p2_428; \ 50700 float32x2_t __rev2_428; __rev2_428 = __builtin_shufflevector(__s2_428, __s2_428, 1, 0); \ 50701 __ret_428 = __noswap_vfmas_lane_f32(__s0_428, -__s1_428, __rev2_428, __p3_428); \ 50702 __ret_428; \ 50703 }) 50704 #endif 50705 50706 #ifdef __LITTLE_ENDIAN__ 50707 #define vfmsq_lane_f64(__p0_429, __p1_429, __p2_429, __p3_429) __extension__ ({ \ 50708 float64x2_t __ret_429; \ 50709 float64x2_t __s0_429 = __p0_429; \ 50710 float64x2_t __s1_429 = __p1_429; \ 50711 float64x1_t __s2_429 = __p2_429; \ 50712 __ret_429 = vfmaq_lane_f64(__s0_429, -__s1_429, __s2_429, __p3_429); \ 50713 __ret_429; \ 50714 }) 50715 
#else 50716 #define vfmsq_lane_f64(__p0_430, __p1_430, __p2_430, __p3_430) __extension__ ({ \ 50717 float64x2_t __ret_430; \ 50718 float64x2_t __s0_430 = __p0_430; \ 50719 float64x2_t __s1_430 = __p1_430; \ 50720 float64x1_t __s2_430 = __p2_430; \ 50721 float64x2_t __rev0_430; __rev0_430 = __builtin_shufflevector(__s0_430, __s0_430, 1, 0); \ 50722 float64x2_t __rev1_430; __rev1_430 = __builtin_shufflevector(__s1_430, __s1_430, 1, 0); \ 50723 __ret_430 = __noswap_vfmaq_lane_f64(__rev0_430, -__rev1_430, __s2_430, __p3_430); \ 50724 __ret_430 = __builtin_shufflevector(__ret_430, __ret_430, 1, 0); \ 50725 __ret_430; \ 50726 }) 50727 #endif 50728 50729 #ifdef __LITTLE_ENDIAN__ 50730 #define vfmsq_lane_f32(__p0_431, __p1_431, __p2_431, __p3_431) __extension__ ({ \ 50731 float32x4_t __ret_431; \ 50732 float32x4_t __s0_431 = __p0_431; \ 50733 float32x4_t __s1_431 = __p1_431; \ 50734 float32x2_t __s2_431 = __p2_431; \ 50735 __ret_431 = vfmaq_lane_f32(__s0_431, -__s1_431, __s2_431, __p3_431); \ 50736 __ret_431; \ 50737 }) 50738 #else 50739 #define vfmsq_lane_f32(__p0_432, __p1_432, __p2_432, __p3_432) __extension__ ({ \ 50740 float32x4_t __ret_432; \ 50741 float32x4_t __s0_432 = __p0_432; \ 50742 float32x4_t __s1_432 = __p1_432; \ 50743 float32x2_t __s2_432 = __p2_432; \ 50744 float32x4_t __rev0_432; __rev0_432 = __builtin_shufflevector(__s0_432, __s0_432, 3, 2, 1, 0); \ 50745 float32x4_t __rev1_432; __rev1_432 = __builtin_shufflevector(__s1_432, __s1_432, 3, 2, 1, 0); \ 50746 float32x2_t __rev2_432; __rev2_432 = __builtin_shufflevector(__s2_432, __s2_432, 1, 0); \ 50747 __ret_432 = __noswap_vfmaq_lane_f32(__rev0_432, -__rev1_432, __rev2_432, __p3_432); \ 50748 __ret_432 = __builtin_shufflevector(__ret_432, __ret_432, 3, 2, 1, 0); \ 50749 __ret_432; \ 50750 }) 50751 #endif 50752 50753 #define vfms_lane_f64(__p0_433, __p1_433, __p2_433, __p3_433) __extension__ ({ \ 50754 float64x1_t __ret_433; \ 50755 float64x1_t __s0_433 = __p0_433; \ 50756 float64x1_t __s1_433 = __p1_433; \ 
50757 float64x1_t __s2_433 = __p2_433; \ 50758 __ret_433 = vfma_lane_f64(__s0_433, -__s1_433, __s2_433, __p3_433); \ 50759 __ret_433; \ 50760 }) 50761 #ifdef __LITTLE_ENDIAN__ 50762 #define vfms_lane_f32(__p0_434, __p1_434, __p2_434, __p3_434) __extension__ ({ \ 50763 float32x2_t __ret_434; \ 50764 float32x2_t __s0_434 = __p0_434; \ 50765 float32x2_t __s1_434 = __p1_434; \ 50766 float32x2_t __s2_434 = __p2_434; \ 50767 __ret_434 = vfma_lane_f32(__s0_434, -__s1_434, __s2_434, __p3_434); \ 50768 __ret_434; \ 50769 }) 50770 #else 50771 #define vfms_lane_f32(__p0_435, __p1_435, __p2_435, __p3_435) __extension__ ({ \ 50772 float32x2_t __ret_435; \ 50773 float32x2_t __s0_435 = __p0_435; \ 50774 float32x2_t __s1_435 = __p1_435; \ 50775 float32x2_t __s2_435 = __p2_435; \ 50776 float32x2_t __rev0_435; __rev0_435 = __builtin_shufflevector(__s0_435, __s0_435, 1, 0); \ 50777 float32x2_t __rev1_435; __rev1_435 = __builtin_shufflevector(__s1_435, __s1_435, 1, 0); \ 50778 float32x2_t __rev2_435; __rev2_435 = __builtin_shufflevector(__s2_435, __s2_435, 1, 0); \ 50779 __ret_435 = __noswap_vfma_lane_f32(__rev0_435, -__rev1_435, __rev2_435, __p3_435); \ 50780 __ret_435 = __builtin_shufflevector(__ret_435, __ret_435, 1, 0); \ 50781 __ret_435; \ 50782 }) 50783 #endif 50784 50785 #ifdef __LITTLE_ENDIAN__ 50786 #define vfmsd_laneq_f64(__p0_436, __p1_436, __p2_436, __p3_436) __extension__ ({ \ 50787 float64_t __ret_436; \ 50788 float64_t __s0_436 = __p0_436; \ 50789 float64_t __s1_436 = __p1_436; \ 50790 float64x2_t __s2_436 = __p2_436; \ 50791 __ret_436 = vfmad_laneq_f64(__s0_436, -__s1_436, __s2_436, __p3_436); \ 50792 __ret_436; \ 50793 }) 50794 #else 50795 #define vfmsd_laneq_f64(__p0_437, __p1_437, __p2_437, __p3_437) __extension__ ({ \ 50796 float64_t __ret_437; \ 50797 float64_t __s0_437 = __p0_437; \ 50798 float64_t __s1_437 = __p1_437; \ 50799 float64x2_t __s2_437 = __p2_437; \ 50800 float64x2_t __rev2_437; __rev2_437 = __builtin_shufflevector(__s2_437, __s2_437, 1, 0); \ 50801 
__ret_437 = __noswap_vfmad_laneq_f64(__s0_437, -__s1_437, __rev2_437, __p3_437); \ 50802 __ret_437; \ 50803 }) 50804 #endif 50805 50806 #ifdef __LITTLE_ENDIAN__ 50807 #define vfmss_laneq_f32(__p0_438, __p1_438, __p2_438, __p3_438) __extension__ ({ \ 50808 float32_t __ret_438; \ 50809 float32_t __s0_438 = __p0_438; \ 50810 float32_t __s1_438 = __p1_438; \ 50811 float32x4_t __s2_438 = __p2_438; \ 50812 __ret_438 = vfmas_laneq_f32(__s0_438, -__s1_438, __s2_438, __p3_438); \ 50813 __ret_438; \ 50814 }) 50815 #else 50816 #define vfmss_laneq_f32(__p0_439, __p1_439, __p2_439, __p3_439) __extension__ ({ \ 50817 float32_t __ret_439; \ 50818 float32_t __s0_439 = __p0_439; \ 50819 float32_t __s1_439 = __p1_439; \ 50820 float32x4_t __s2_439 = __p2_439; \ 50821 float32x4_t __rev2_439; __rev2_439 = __builtin_shufflevector(__s2_439, __s2_439, 3, 2, 1, 0); \ 50822 __ret_439 = __noswap_vfmas_laneq_f32(__s0_439, -__s1_439, __rev2_439, __p3_439); \ 50823 __ret_439; \ 50824 }) 50825 #endif 50826 50827 #ifdef __LITTLE_ENDIAN__ 50828 #define vfmsq_laneq_f64(__p0_440, __p1_440, __p2_440, __p3_440) __extension__ ({ \ 50829 float64x2_t __ret_440; \ 50830 float64x2_t __s0_440 = __p0_440; \ 50831 float64x2_t __s1_440 = __p1_440; \ 50832 float64x2_t __s2_440 = __p2_440; \ 50833 __ret_440 = vfmaq_laneq_f64(__s0_440, -__s1_440, __s2_440, __p3_440); \ 50834 __ret_440; \ 50835 }) 50836 #else 50837 #define vfmsq_laneq_f64(__p0_441, __p1_441, __p2_441, __p3_441) __extension__ ({ \ 50838 float64x2_t __ret_441; \ 50839 float64x2_t __s0_441 = __p0_441; \ 50840 float64x2_t __s1_441 = __p1_441; \ 50841 float64x2_t __s2_441 = __p2_441; \ 50842 float64x2_t __rev0_441; __rev0_441 = __builtin_shufflevector(__s0_441, __s0_441, 1, 0); \ 50843 float64x2_t __rev1_441; __rev1_441 = __builtin_shufflevector(__s1_441, __s1_441, 1, 0); \ 50844 float64x2_t __rev2_441; __rev2_441 = __builtin_shufflevector(__s2_441, __s2_441, 1, 0); \ 50845 __ret_441 = __noswap_vfmaq_laneq_f64(__rev0_441, -__rev1_441, __rev2_441, 
__p3_441); \ 50846 __ret_441 = __builtin_shufflevector(__ret_441, __ret_441, 1, 0); \ 50847 __ret_441; \ 50848 }) 50849 #endif 50850 50851 #ifdef __LITTLE_ENDIAN__ 50852 #define vfmsq_laneq_f32(__p0_442, __p1_442, __p2_442, __p3_442) __extension__ ({ \ 50853 float32x4_t __ret_442; \ 50854 float32x4_t __s0_442 = __p0_442; \ 50855 float32x4_t __s1_442 = __p1_442; \ 50856 float32x4_t __s2_442 = __p2_442; \ 50857 __ret_442 = vfmaq_laneq_f32(__s0_442, -__s1_442, __s2_442, __p3_442); \ 50858 __ret_442; \ 50859 }) 50860 #else 50861 #define vfmsq_laneq_f32(__p0_443, __p1_443, __p2_443, __p3_443) __extension__ ({ \ 50862 float32x4_t __ret_443; \ 50863 float32x4_t __s0_443 = __p0_443; \ 50864 float32x4_t __s1_443 = __p1_443; \ 50865 float32x4_t __s2_443 = __p2_443; \ 50866 float32x4_t __rev0_443; __rev0_443 = __builtin_shufflevector(__s0_443, __s0_443, 3, 2, 1, 0); \ 50867 float32x4_t __rev1_443; __rev1_443 = __builtin_shufflevector(__s1_443, __s1_443, 3, 2, 1, 0); \ 50868 float32x4_t __rev2_443; __rev2_443 = __builtin_shufflevector(__s2_443, __s2_443, 3, 2, 1, 0); \ 50869 __ret_443 = __noswap_vfmaq_laneq_f32(__rev0_443, -__rev1_443, __rev2_443, __p3_443); \ 50870 __ret_443 = __builtin_shufflevector(__ret_443, __ret_443, 3, 2, 1, 0); \ 50871 __ret_443; \ 50872 }) 50873 #endif 50874 50875 #ifdef __LITTLE_ENDIAN__ 50876 #define vfms_laneq_f64(__p0_444, __p1_444, __p2_444, __p3_444) __extension__ ({ \ 50877 float64x1_t __ret_444; \ 50878 float64x1_t __s0_444 = __p0_444; \ 50879 float64x1_t __s1_444 = __p1_444; \ 50880 float64x2_t __s2_444 = __p2_444; \ 50881 __ret_444 = vfma_laneq_f64(__s0_444, -__s1_444, __s2_444, __p3_444); \ 50882 __ret_444; \ 50883 }) 50884 #else 50885 #define vfms_laneq_f64(__p0_445, __p1_445, __p2_445, __p3_445) __extension__ ({ \ 50886 float64x1_t __ret_445; \ 50887 float64x1_t __s0_445 = __p0_445; \ 50888 float64x1_t __s1_445 = __p1_445; \ 50889 float64x2_t __s2_445 = __p2_445; \ 50890 float64x2_t __rev2_445; __rev2_445 = 
__builtin_shufflevector(__s2_445, __s2_445, 1, 0); \ 50891 __ret_445 = __noswap_vfma_laneq_f64(__s0_445, -__s1_445, __rev2_445, __p3_445); \ 50892 __ret_445; \ 50893 }) 50894 #endif 50895 50896 #ifdef __LITTLE_ENDIAN__ 50897 #define vfms_laneq_f32(__p0_446, __p1_446, __p2_446, __p3_446) __extension__ ({ \ 50898 float32x2_t __ret_446; \ 50899 float32x2_t __s0_446 = __p0_446; \ 50900 float32x2_t __s1_446 = __p1_446; \ 50901 float32x4_t __s2_446 = __p2_446; \ 50902 __ret_446 = vfma_laneq_f32(__s0_446, -__s1_446, __s2_446, __p3_446); \ 50903 __ret_446; \ 50904 }) 50905 #else 50906 #define vfms_laneq_f32(__p0_447, __p1_447, __p2_447, __p3_447) __extension__ ({ \ 50907 float32x2_t __ret_447; \ 50908 float32x2_t __s0_447 = __p0_447; \ 50909 float32x2_t __s1_447 = __p1_447; \ 50910 float32x4_t __s2_447 = __p2_447; \ 50911 float32x2_t __rev0_447; __rev0_447 = __builtin_shufflevector(__s0_447, __s0_447, 1, 0); \ 50912 float32x2_t __rev1_447; __rev1_447 = __builtin_shufflevector(__s1_447, __s1_447, 1, 0); \ 50913 float32x4_t __rev2_447; __rev2_447 = __builtin_shufflevector(__s2_447, __s2_447, 3, 2, 1, 0); \ 50914 __ret_447 = __noswap_vfma_laneq_f32(__rev0_447, -__rev1_447, __rev2_447, __p3_447); \ 50915 __ret_447 = __builtin_shufflevector(__ret_447, __ret_447, 1, 0); \ 50916 __ret_447; \ 50917 }) 50918 #endif 50919 50920 #ifdef __LITTLE_ENDIAN__ 50921 __ai __attribute__((target("neon"))) float64x2_t vfmsq_n_f64(float64x2_t __p0, float64x2_t __p1, float64_t __p2) { 50922 float64x2_t __ret; 50923 __ret = vfmaq_f64(__p0, -__p1, (float64x2_t) {__p2, __p2}); 50924 return __ret; 50925 } 50926 #else 50927 __ai __attribute__((target("neon"))) float64x2_t vfmsq_n_f64(float64x2_t __p0, float64x2_t __p1, float64_t __p2) { 50928 float64x2_t __ret; 50929 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 50930 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 50931 __ret = __noswap_vfmaq_f64(__rev0, -__rev1, (float64x2_t) {__p2, __p2}); 50932 
__ret = __builtin_shufflevector(__ret, __ret, 1, 0); 50933 return __ret; 50934 } 50935 #endif 50936 50937 #ifdef __LITTLE_ENDIAN__ 50938 __ai __attribute__((target("neon"))) float32x4_t vfmsq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) { 50939 float32x4_t __ret; 50940 __ret = vfmaq_f32(__p0, -__p1, (float32x4_t) {__p2, __p2, __p2, __p2}); 50941 return __ret; 50942 } 50943 #else 50944 __ai __attribute__((target("neon"))) float32x4_t vfmsq_n_f32(float32x4_t __p0, float32x4_t __p1, float32_t __p2) { 50945 float32x4_t __ret; 50946 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 50947 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 50948 __ret = __noswap_vfmaq_f32(__rev0, -__rev1, (float32x4_t) {__p2, __p2, __p2, __p2}); 50949 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 50950 return __ret; 50951 } 50952 #endif 50953 50954 __ai __attribute__((target("neon"))) float64x1_t vfms_n_f64(float64x1_t __p0, float64x1_t __p1, float64_t __p2) { 50955 float64x1_t __ret; 50956 __ret = vfma_f64(__p0, -__p1, (float64x1_t) {__p2}); 50957 return __ret; 50958 } 50959 #ifdef __LITTLE_ENDIAN__ 50960 __ai __attribute__((target("neon"))) float32x2_t vfms_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) { 50961 float32x2_t __ret; 50962 __ret = vfma_f32(__p0, -__p1, (float32x2_t) {__p2, __p2}); 50963 return __ret; 50964 } 50965 #else 50966 __ai __attribute__((target("neon"))) float32x2_t vfms_n_f32(float32x2_t __p0, float32x2_t __p1, float32_t __p2) { 50967 float32x2_t __ret; 50968 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 50969 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 50970 __ret = __noswap_vfma_f32(__rev0, -__rev1, (float32x2_t) {__p2, __p2}); 50971 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 50972 return __ret; 50973 } 50974 #endif 50975 50976 #ifdef __LITTLE_ENDIAN__ 50977 __ai __attribute__((target("neon"))) poly64x1_t 
vget_high_p64(poly64x2_t __p0) { 50978 poly64x1_t __ret; 50979 __ret = __builtin_shufflevector(__p0, __p0, 1); 50980 return __ret; 50981 } 50982 #else 50983 __ai __attribute__((target("neon"))) poly64x1_t vget_high_p64(poly64x2_t __p0) { 50984 poly64x1_t __ret; 50985 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 50986 __ret = __builtin_shufflevector(__rev0, __rev0, 1); 50987 return __ret; 50988 } 50989 __ai __attribute__((target("neon"))) poly64x1_t __noswap_vget_high_p64(poly64x2_t __p0) { 50990 poly64x1_t __ret; 50991 __ret = __builtin_shufflevector(__p0, __p0, 1); 50992 return __ret; 50993 } 50994 #endif 50995 50996 #ifdef __LITTLE_ENDIAN__ 50997 __ai __attribute__((target("neon"))) float64x1_t vget_high_f64(float64x2_t __p0) { 50998 float64x1_t __ret; 50999 __ret = __builtin_shufflevector(__p0, __p0, 1); 51000 return __ret; 51001 } 51002 #else 51003 __ai __attribute__((target("neon"))) float64x1_t vget_high_f64(float64x2_t __p0) { 51004 float64x1_t __ret; 51005 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 51006 __ret = __builtin_shufflevector(__rev0, __rev0, 1); 51007 return __ret; 51008 } 51009 #endif 51010 51011 #define vget_lane_p64(__p0, __p1) __extension__ ({ \ 51012 poly64_t __ret; \ 51013 poly64x1_t __s0 = __p0; \ 51014 __ret = (poly64_t) __builtin_neon_vget_lane_i64((poly64x1_t)__s0, __p1); \ 51015 __ret; \ 51016 }) 51017 #ifdef __LITTLE_ENDIAN__ 51018 #define vgetq_lane_p64(__p0, __p1) __extension__ ({ \ 51019 poly64_t __ret; \ 51020 poly64x2_t __s0 = __p0; \ 51021 __ret = (poly64_t) __builtin_neon_vgetq_lane_i64((poly64x2_t)__s0, __p1); \ 51022 __ret; \ 51023 }) 51024 #else 51025 #define vgetq_lane_p64(__p0, __p1) __extension__ ({ \ 51026 poly64_t __ret; \ 51027 poly64x2_t __s0 = __p0; \ 51028 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 51029 __ret = (poly64_t) __builtin_neon_vgetq_lane_i64((poly64x2_t)__rev0, __p1); \ 51030 __ret; \ 51031 }) 51032 #define 
__noswap_vgetq_lane_p64(__p0, __p1) __extension__ ({ \ 51033 poly64_t __ret; \ 51034 poly64x2_t __s0 = __p0; \ 51035 __ret = (poly64_t) __builtin_neon_vgetq_lane_i64((poly64x2_t)__s0, __p1); \ 51036 __ret; \ 51037 }) 51038 #endif 51039 51040 #ifdef __LITTLE_ENDIAN__ 51041 #define vgetq_lane_f64(__p0, __p1) __extension__ ({ \ 51042 float64_t __ret; \ 51043 float64x2_t __s0 = __p0; \ 51044 __ret = (float64_t) __builtin_neon_vgetq_lane_f64((float64x2_t)__s0, __p1); \ 51045 __ret; \ 51046 }) 51047 #else 51048 #define vgetq_lane_f64(__p0, __p1) __extension__ ({ \ 51049 float64_t __ret; \ 51050 float64x2_t __s0 = __p0; \ 51051 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 51052 __ret = (float64_t) __builtin_neon_vgetq_lane_f64((float64x2_t)__rev0, __p1); \ 51053 __ret; \ 51054 }) 51055 #define __noswap_vgetq_lane_f64(__p0, __p1) __extension__ ({ \ 51056 float64_t __ret; \ 51057 float64x2_t __s0 = __p0; \ 51058 __ret = (float64_t) __builtin_neon_vgetq_lane_f64((float64x2_t)__s0, __p1); \ 51059 __ret; \ 51060 }) 51061 #endif 51062 51063 #define vget_lane_f64(__p0, __p1) __extension__ ({ \ 51064 float64_t __ret; \ 51065 float64x1_t __s0 = __p0; \ 51066 __ret = (float64_t) __builtin_neon_vget_lane_f64((float64x1_t)__s0, __p1); \ 51067 __ret; \ 51068 }) 51069 #ifdef __LITTLE_ENDIAN__ 51070 __ai __attribute__((target("neon"))) poly64x1_t vget_low_p64(poly64x2_t __p0) { 51071 poly64x1_t __ret; 51072 __ret = __builtin_shufflevector(__p0, __p0, 0); 51073 return __ret; 51074 } 51075 #else 51076 __ai __attribute__((target("neon"))) poly64x1_t vget_low_p64(poly64x2_t __p0) { 51077 poly64x1_t __ret; 51078 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 51079 __ret = __builtin_shufflevector(__rev0, __rev0, 0); 51080 return __ret; 51081 } 51082 #endif 51083 51084 #ifdef __LITTLE_ENDIAN__ 51085 __ai __attribute__((target("neon"))) float64x1_t vget_low_f64(float64x2_t __p0) { 51086 float64x1_t __ret; 51087 __ret = 
__builtin_shufflevector(__p0, __p0, 0); 51088 return __ret; 51089 } 51090 #else 51091 __ai __attribute__((target("neon"))) float64x1_t vget_low_f64(float64x2_t __p0) { 51092 float64x1_t __ret; 51093 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 51094 __ret = __builtin_shufflevector(__rev0, __rev0, 0); 51095 return __ret; 51096 } 51097 #endif 51098 51099 #define vld1_p64(__p0) __extension__ ({ \ 51100 poly64x1_t __ret; \ 51101 __ret = (poly64x1_t) __builtin_neon_vld1_v(__p0, 6); \ 51102 __ret; \ 51103 }) 51104 #ifdef __LITTLE_ENDIAN__ 51105 #define vld1q_p64(__p0) __extension__ ({ \ 51106 poly64x2_t __ret; \ 51107 __ret = (poly64x2_t) __builtin_neon_vld1q_v(__p0, 38); \ 51108 __ret; \ 51109 }) 51110 #else 51111 #define vld1q_p64(__p0) __extension__ ({ \ 51112 poly64x2_t __ret; \ 51113 __ret = (poly64x2_t) __builtin_neon_vld1q_v(__p0, 38); \ 51114 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 51115 __ret; \ 51116 }) 51117 #endif 51118 51119 #ifdef __LITTLE_ENDIAN__ 51120 #define vld1q_f64(__p0) __extension__ ({ \ 51121 float64x2_t __ret; \ 51122 __ret = (float64x2_t) __builtin_neon_vld1q_v(__p0, 42); \ 51123 __ret; \ 51124 }) 51125 #else 51126 #define vld1q_f64(__p0) __extension__ ({ \ 51127 float64x2_t __ret; \ 51128 __ret = (float64x2_t) __builtin_neon_vld1q_v(__p0, 42); \ 51129 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 51130 __ret; \ 51131 }) 51132 #endif 51133 51134 #define vld1_f64(__p0) __extension__ ({ \ 51135 float64x1_t __ret; \ 51136 __ret = (float64x1_t) __builtin_neon_vld1_v(__p0, 10); \ 51137 __ret; \ 51138 }) 51139 #define vld1_dup_p64(__p0) __extension__ ({ \ 51140 poly64x1_t __ret; \ 51141 __ret = (poly64x1_t) __builtin_neon_vld1_dup_v(__p0, 6); \ 51142 __ret; \ 51143 }) 51144 #ifdef __LITTLE_ENDIAN__ 51145 #define vld1q_dup_p64(__p0) __extension__ ({ \ 51146 poly64x2_t __ret; \ 51147 __ret = (poly64x2_t) __builtin_neon_vld1q_dup_v(__p0, 38); \ 51148 __ret; \ 51149 }) 51150 #else 51151 #define 
vld1q_dup_p64(__p0) __extension__ ({ \ 51152 poly64x2_t __ret; \ 51153 __ret = (poly64x2_t) __builtin_neon_vld1q_dup_v(__p0, 38); \ 51154 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 51155 __ret; \ 51156 }) 51157 #endif 51158 51159 #ifdef __LITTLE_ENDIAN__ 51160 #define vld1q_dup_f64(__p0) __extension__ ({ \ 51161 float64x2_t __ret; \ 51162 __ret = (float64x2_t) __builtin_neon_vld1q_dup_v(__p0, 42); \ 51163 __ret; \ 51164 }) 51165 #else 51166 #define vld1q_dup_f64(__p0) __extension__ ({ \ 51167 float64x2_t __ret; \ 51168 __ret = (float64x2_t) __builtin_neon_vld1q_dup_v(__p0, 42); \ 51169 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 51170 __ret; \ 51171 }) 51172 #endif 51173 51174 #define vld1_dup_f64(__p0) __extension__ ({ \ 51175 float64x1_t __ret; \ 51176 __ret = (float64x1_t) __builtin_neon_vld1_dup_v(__p0, 10); \ 51177 __ret; \ 51178 }) 51179 #define vld1_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 51180 poly64x1_t __ret; \ 51181 poly64x1_t __s1 = __p1; \ 51182 __ret = (poly64x1_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 6); \ 51183 __ret; \ 51184 }) 51185 #ifdef __LITTLE_ENDIAN__ 51186 #define vld1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 51187 poly64x2_t __ret; \ 51188 poly64x2_t __s1 = __p1; \ 51189 __ret = (poly64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 38); \ 51190 __ret; \ 51191 }) 51192 #else 51193 #define vld1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 51194 poly64x2_t __ret; \ 51195 poly64x2_t __s1 = __p1; \ 51196 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 51197 __ret = (poly64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 38); \ 51198 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 51199 __ret; \ 51200 }) 51201 #endif 51202 51203 #ifdef __LITTLE_ENDIAN__ 51204 #define vld1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 51205 float64x2_t __ret; \ 51206 float64x2_t __s1 = __p1; \ 51207 __ret = (float64x2_t) 
__builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__s1, __p2, 42); \
  __ret; \
})
#else
/* Non-__LITTLE_ENDIAN__ vld1q_lane_f64: lane-swaps the input vector into
 * __rev1 before the builtin call and lane-swaps the result afterwards. */
#define vld1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  float64x2_t __ret; \
  float64x2_t __s1 = __p1; \
  float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \
  __ret = (float64x2_t) __builtin_neon_vld1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 42); \
  __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \
  __ret; \
})
#endif

/* The macros below are GNU statement expressions whose value is __ret.
 * NOTE(review): the last integer argument of each __builtin_neon_* call is
 * presumably a vector-type selector -- confirm against the compiler's NEON
 * builtin definitions. */

/* vld1_lane_f64(__p0, __p1, __p2): copies __p1 into __s1, passes __p0, __s1
 * (cast to int8x8_t) and __p2 to __builtin_neon_vld1_lane_v with selector
 * 10, and yields the result cast to float64x1_t. */
#define vld1_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  float64x1_t __ret; \
  float64x1_t __s1 = __p1; \
  __ret = (float64x1_t) __builtin_neon_vld1_lane_v(__p0, (int8x8_t)__s1, __p2, 10); \
  __ret; \
})
/* vld1_p64_x2(__p0): __builtin_neon_vld1_x2_v writes the poly64x1x2_t
 * result through &__ret (selector 6); the struct is then yielded. */
#define vld1_p64_x2(__p0) __extension__ ({ \
  poly64x1x2_t __ret; \
  __builtin_neon_vld1_x2_v(&__ret, __p0, 6); \
  __ret; \
})
/* vld1q_p64_x2(__p0): poly64x2x2_t counterpart via __builtin_neon_vld1q_x2_v
 * (selector 38). The #else variant lane-swaps val[0] and val[1] of the
 * result in place before yielding it. */
#ifdef __LITTLE_ENDIAN__
#define vld1q_p64_x2(__p0) __extension__ ({ \
  poly64x2x2_t __ret; \
  __builtin_neon_vld1q_x2_v(&__ret, __p0, 38); \
  __ret; \
})
#else
#define vld1q_p64_x2(__p0) __extension__ ({ \
  poly64x2x2_t __ret; \
  __builtin_neon_vld1q_x2_v(&__ret, __p0, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld1q_f64_x2(__p0): same shape as vld1q_p64_x2 for float64x2x2_t
 * (selector 42). */
#ifdef __LITTLE_ENDIAN__
#define vld1q_f64_x2(__p0) __extension__ ({ \
  float64x2x2_t __ret; \
  __builtin_neon_vld1q_x2_v(&__ret, __p0, 42); \
  __ret; \
})
#else
#define vld1q_f64_x2(__p0) __extension__ ({ \
  float64x2x2_t __ret; \
  __builtin_neon_vld1q_x2_v(&__ret, __p0, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif
/* The macros below are GNU statement expressions whose value is __ret; in
 * each, the builtin writes its result through &__ret.
 * NOTE(review): the last integer argument of each __builtin_neon_* call is
 * presumably a vector-type selector (6 poly64x1, 38 poly64x2, 10 float64x1,
 * 42 float64x2 in this block) -- confirm against the compiler's NEON builtin
 * definitions. */

/* vld1_f64_x2(__p0): float64x1x2_t filled by __builtin_neon_vld1_x2_v. */
#define vld1_f64_x2(__p0) __extension__ ({ \
  float64x1x2_t __ret; \
  __builtin_neon_vld1_x2_v(&__ret, __p0, 10); \
  __ret; \
})
/* vld1_p64_x3(__p0): poly64x1x3_t filled by __builtin_neon_vld1_x3_v. */
#define vld1_p64_x3(__p0) __extension__ ({ \
  poly64x1x3_t __ret; \
  __builtin_neon_vld1_x3_v(&__ret, __p0, 6); \
  __ret; \
})
/* vld1q_p64_x3(__p0): poly64x2x3_t filled by __builtin_neon_vld1q_x3_v.
 * When __LITTLE_ENDIAN__ is not defined, val[0..2] are each lane-swapped in
 * place before the struct is yielded. */
#ifdef __LITTLE_ENDIAN__
#define vld1q_p64_x3(__p0) __extension__ ({ \
  poly64x2x3_t __ret; \
  __builtin_neon_vld1q_x3_v(&__ret, __p0, 38); \
  __ret; \
})
#else
#define vld1q_p64_x3(__p0) __extension__ ({ \
  poly64x2x3_t __ret; \
  __builtin_neon_vld1q_x3_v(&__ret, __p0, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld1q_f64_x3(__p0): same shape as vld1q_p64_x3 for float64x2x3_t. */
#ifdef __LITTLE_ENDIAN__
#define vld1q_f64_x3(__p0) __extension__ ({ \
  float64x2x3_t __ret; \
  __builtin_neon_vld1q_x3_v(&__ret, __p0, 42); \
  __ret; \
})
#else
#define vld1q_f64_x3(__p0) __extension__ ({ \
  float64x2x3_t __ret; \
  __builtin_neon_vld1q_x3_v(&__ret, __p0, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld1_f64_x3(__p0): float64x1x3_t filled by __builtin_neon_vld1_x3_v. */
#define vld1_f64_x3(__p0) __extension__ ({ \
  float64x1x3_t __ret; \
  __builtin_neon_vld1_x3_v(&__ret, __p0, 10); \
  __ret; \
})
/* vld1_p64_x4(__p0): poly64x1x4_t filled by __builtin_neon_vld1_x4_v. */
#define vld1_p64_x4(__p0) __extension__ ({ \
  poly64x1x4_t __ret; \
  __builtin_neon_vld1_x4_v(&__ret, __p0, 6); \
  __ret; \
})
/* vld1q_p64_x4(__p0): poly64x2x4_t filled by __builtin_neon_vld1q_x4_v
 * (selector 38); the #else variant lane-swaps val[0..3] afterwards. */
#ifdef __LITTLE_ENDIAN__
#define vld1q_p64_x4(__p0) __extension__ ({ \
  poly64x2x4_t __ret; \
__builtin_neon_vld1q_x4_v(&__ret, __p0, 38); \
  __ret; \
})
#else
/* Non-__LITTLE_ENDIAN__ vld1q_p64_x4: after the builtin fills __ret, each of
 * val[0..3] is lane-swapped in place before the struct is yielded. */
#define vld1q_p64_x4(__p0) __extension__ ({ \
  poly64x2x4_t __ret; \
  __builtin_neon_vld1q_x4_v(&__ret, __p0, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  __ret; \
})
#endif

/* The macros below are GNU statement expressions whose value is __ret; in
 * each, the builtin writes its result through &__ret.
 * NOTE(review): the last integer argument of each __builtin_neon_* call is
 * presumably a vector-type selector -- confirm against the compiler's NEON
 * builtin definitions. */

/* vld1q_f64_x4(__p0): float64x2x4_t filled by __builtin_neon_vld1q_x4_v
 * (selector 42); the #else variant lane-swaps val[0..3] afterwards. */
#ifdef __LITTLE_ENDIAN__
#define vld1q_f64_x4(__p0) __extension__ ({ \
  float64x2x4_t __ret; \
  __builtin_neon_vld1q_x4_v(&__ret, __p0, 42); \
  __ret; \
})
#else
#define vld1q_f64_x4(__p0) __extension__ ({ \
  float64x2x4_t __ret; \
  __builtin_neon_vld1q_x4_v(&__ret, __p0, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  __ret; \
})
#endif

/* vld1_f64_x4(__p0): float64x1x4_t filled by __builtin_neon_vld1_x4_v
 * (selector 10). */
#define vld1_f64_x4(__p0) __extension__ ({ \
  float64x1x4_t __ret; \
  __builtin_neon_vld1_x4_v(&__ret, __p0, 10); \
  __ret; \
})
/* vld2_p64(__p0): poly64x1x2_t filled by __builtin_neon_vld2_v (selector 6). */
#define vld2_p64(__p0) __extension__ ({ \
  poly64x1x2_t __ret; \
  __builtin_neon_vld2_v(&__ret, __p0, 6); \
  __ret; \
})
/* vld2q_p64(__p0): poly64x2x2_t filled by __builtin_neon_vld2q_v (selector
 * 38); the #else variant lane-swaps val[0] and val[1] afterwards. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_p64(__p0) __extension__ ({ \
  poly64x2x2_t __ret; \
  __builtin_neon_vld2q_v(&__ret, __p0, 38); \
  __ret; \
})
#else
#define vld2q_p64(__p0) __extension__ ({ \
  poly64x2x2_t __ret; \
  __builtin_neon_vld2q_v(&__ret, __p0, 38); \
 \
  __ret.val[0] =
__builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* The macros below are GNU statement expressions whose value is __ret; in
 * each, __builtin_neon_vld2q_v / __builtin_neon_vld2_v writes its result
 * through &__ret.
 * NOTE(review): the last integer argument of each builtin call is presumably
 * a vector-type selector (51 uint64x2, 42 float64x2, 35 int64x2, 10
 * float64x1 in this block) -- confirm against the compiler's NEON builtin
 * definitions. */

/* vld2q_u64(__p0): yields a uint64x2x2_t. When __LITTLE_ENDIAN__ is not
 * defined, val[0] and val[1] are each lane-swapped in place first. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_u64(__p0) __extension__ ({ \
  uint64x2x2_t __ret; \
  __builtin_neon_vld2q_v(&__ret, __p0, 51); \
  __ret; \
})
#else
#define vld2q_u64(__p0) __extension__ ({ \
  uint64x2x2_t __ret; \
  __builtin_neon_vld2q_v(&__ret, __p0, 51); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld2q_f64(__p0): same shape as vld2q_u64 for float64x2x2_t. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_f64(__p0) __extension__ ({ \
  float64x2x2_t __ret; \
  __builtin_neon_vld2q_v(&__ret, __p0, 42); \
  __ret; \
})
#else
#define vld2q_f64(__p0) __extension__ ({ \
  float64x2x2_t __ret; \
  __builtin_neon_vld2q_v(&__ret, __p0, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld2q_s64(__p0): same shape as vld2q_u64 for int64x2x2_t. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_s64(__p0) __extension__ ({ \
  int64x2x2_t __ret; \
  __builtin_neon_vld2q_v(&__ret, __p0, 35); \
  __ret; \
})
#else
#define vld2q_s64(__p0) __extension__ ({ \
  int64x2x2_t __ret; \
  __builtin_neon_vld2q_v(&__ret, __p0, 35); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld2_f64(__p0): float64x1x2_t filled by __builtin_neon_vld2_v. */
#define vld2_f64(__p0) __extension__ ({ \
  float64x1x2_t __ret; \
  __builtin_neon_vld2_v(&__ret, __p0, 10); \
  __ret; \
})
/* vld2_dup_p64(__p0): poly64x1x2_t filled by __builtin_neon_vld2_dup_v
 * (selector 6). */
#define vld2_dup_p64(__p0) __extension__ ({ \
poly64x1x2_t __ret; \
  __builtin_neon_vld2_dup_v(&__ret, __p0, 6); \
  __ret; \
})
/* The macros below are GNU statement expressions whose value is __ret; in
 * each, the builtin writes its result through &__ret.
 * NOTE(review): the last integer argument of each __builtin_neon_* call is
 * presumably a vector-type selector -- confirm against the compiler's NEON
 * builtin definitions. */

/* vld2q_dup_p64(__p0): poly64x2x2_t filled by __builtin_neon_vld2q_dup_v
 * (selector 38). When __LITTLE_ENDIAN__ is not defined, val[0] and val[1]
 * are each lane-swapped in place before the struct is yielded. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_dup_p64(__p0) __extension__ ({ \
  poly64x2x2_t __ret; \
  __builtin_neon_vld2q_dup_v(&__ret, __p0, 38); \
  __ret; \
})
#else
#define vld2q_dup_p64(__p0) __extension__ ({ \
  poly64x2x2_t __ret; \
  __builtin_neon_vld2q_dup_v(&__ret, __p0, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld2q_dup_f64(__p0): same shape as vld2q_dup_p64 for float64x2x2_t
 * (selector 42). */
#ifdef __LITTLE_ENDIAN__
#define vld2q_dup_f64(__p0) __extension__ ({ \
  float64x2x2_t __ret; \
  __builtin_neon_vld2q_dup_v(&__ret, __p0, 42); \
  __ret; \
})
#else
#define vld2q_dup_f64(__p0) __extension__ ({ \
  float64x2x2_t __ret; \
  __builtin_neon_vld2q_dup_v(&__ret, __p0, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld2_dup_f64(__p0): float64x1x2_t filled by __builtin_neon_vld2_dup_v
 * (selector 10). */
#define vld2_dup_f64(__p0) __extension__ ({ \
  float64x1x2_t __ret; \
  __builtin_neon_vld2_dup_v(&__ret, __p0, 10); \
  __ret; \
})
/* vld2_lane_p64(__p0, __p1, __p2): copies __p1 into __s1 and passes __p0,
 * __s1.val[0..1] (each cast to int8x8_t) and __p2 to
 * __builtin_neon_vld2_lane_v with selector 6. __p2 is presumably the lane
 * index (going by the _lane name). */
#define vld2_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  poly64x1x2_t __ret; \
  poly64x1x2_t __s1 = __p1; \
  __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 6); \
  __ret; \
})
/* vld2q_lane_p8(__p0, __p1, __p2): poly8x16x2_t counterpart via
 * __builtin_neon_vld2q_lane_v (int8x16_t casts, selector 36). The #else
 * variant reverses all 16 lanes of each input vector into __rev1 before the
 * call and of each result vector afterwards. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  poly8x16x2_t __ret; \
  poly8x16x2_t __s1 = __p1; \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 36); \
  __ret; \
})
#else
#define vld2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
poly8x16x2_t __ret; \
  poly8x16x2_t __s1 = __p1; \
  poly8x16x2_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 36); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* The macros below are GNU statement expressions whose value is __ret. Each
 * copies __p1 into __s1 and passes __p0, the val[] members of __s1 (cast to
 * int8x16_t) and __p2 to __builtin_neon_vld2q_lane_v, which writes through
 * &__ret.
 * NOTE(review): the last integer argument of the builtin is presumably a
 * vector-type selector, and __p2 presumably the lane index -- confirm
 * against the compiler's NEON builtin definitions. */

/* vld2q_lane_p64(__p0, __p1, __p2): poly64x2x2_t, selector 38. When
 * __LITTLE_ENDIAN__ is not defined, both input vectors are lane-swapped into
 * __rev1 before the call and both result vectors lane-swapped afterwards. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  poly64x2x2_t __ret; \
  poly64x2x2_t __s1 = __p1; \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 38); \
  __ret; \
})
#else
#define vld2q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  poly64x2x2_t __ret; \
  poly64x2x2_t __s1 = __p1; \
  poly64x2x2_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld2q_lane_u8(__p0, __p1, __p2): uint8x16x2_t, selector 48; the #else
 * variant applies a full 16-lane reversal to inputs and results. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  uint8x16x2_t __ret; \
  uint8x16x2_t __s1 = __p1; \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 48); \
  __ret; \
})
#else
/* Non-__LITTLE_ENDIAN__ vld2q_lane_u8: reverses all 16 lanes of each input
 * vector into __rev1, calls __builtin_neon_vld2q_lane_v on the reversed
 * copies (selector 48), then reverses all 16 lanes of each result vector. */
#define vld2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  uint8x16x2_t __ret; \
  uint8x16x2_t __s1 = __p1; \
  uint8x16x2_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 48); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld2q_lane_u64(__p0, __p1, __p2): statement expression yielding a
 * uint64x2x2_t. Copies __p1 into __s1 and passes __p0, __s1.val[0..1] (cast
 * to int8x16_t) and __p2 to __builtin_neon_vld2q_lane_v with selector 51.
 * When __LITTLE_ENDIAN__ is not defined, the inputs are lane-swapped into
 * __rev1 before the call and the results lane-swapped afterwards.
 * NOTE(review): the final integer is presumably a vector-type selector and
 * __p2 the lane index -- confirm against the NEON builtin definitions. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  uint64x2x2_t __ret; \
  uint64x2x2_t __s1 = __p1; \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 51); \
  __ret; \
})
#else
#define vld2q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  uint64x2x2_t __ret; \
  uint64x2x2_t __s1 = __p1; \
  uint64x2x2_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 51); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld2q_lane_s8(__p0, __p1, __p2): int8x16x2_t counterpart (selector 32);
 * the #else variant applies a full 16-lane reversal to inputs and results. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  int8x16x2_t __ret; \
  int8x16x2_t __s1 = __p1; \
__builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 32); \
  __ret; \
})
#else
/* Non-__LITTLE_ENDIAN__ vld2q_lane_s8: reverses all 16 lanes of each input
 * vector into __rev1, calls __builtin_neon_vld2q_lane_v on the reversed
 * copies (selector 32), then reverses all 16 lanes of each result vector. */
#define vld2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  int8x16x2_t __ret; \
  int8x16x2_t __s1 = __p1; \
  int8x16x2_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 32); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld2q_lane_f64(__p0, __p1, __p2): statement expression yielding a
 * float64x2x2_t. Copies __p1 into __s1 and passes __p0, __s1.val[0..1] (cast
 * to int8x16_t) and __p2 to __builtin_neon_vld2q_lane_v with selector 42.
 * When __LITTLE_ENDIAN__ is not defined, the inputs are lane-swapped into
 * __rev1 before the call and the results lane-swapped afterwards.
 * NOTE(review): the final integer is presumably a vector-type selector and
 * __p2 the lane index -- confirm against the NEON builtin definitions. */
#ifdef __LITTLE_ENDIAN__
#define vld2q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  float64x2x2_t __ret; \
  float64x2x2_t __s1 = __p1; \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 42); \
  __ret; \
})
#else
#define vld2q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  float64x2x2_t __ret; \
  float64x2x2_t __s1 = __p1; \
  float64x2x2_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* vld2q_lane_s64(__p0, __p1, __p2): same shape as vld2q_lane_f64 for
 * int64x2x2_t (selector 35). */
#ifdef __LITTLE_ENDIAN__
#define vld2q_lane_s64(__p0,
__p1, __p2) __extension__ ({ \
  int64x2x2_t __ret; \
  int64x2x2_t __s1 = __p1; \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 35); \
  __ret; \
})
#else
/* Non-__LITTLE_ENDIAN__ vld2q_lane_s64: lane-swaps both input vectors into
 * __rev1, calls __builtin_neon_vld2q_lane_v on the swapped copies (selector
 * 35), then lane-swaps both result vectors. */
#define vld2q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  int64x2x2_t __ret; \
  int64x2x2_t __s1 = __p1; \
  int64x2x2_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __builtin_neon_vld2q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 35); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret; \
})
#endif

/* The macros below are GNU statement expressions whose value is __ret; in
 * each, the builtin writes its result through &__ret.
 * NOTE(review): the last integer argument of each __builtin_neon_* call is
 * presumably a vector-type selector, and __p2 in the _lane macros presumably
 * the lane index -- confirm against the compiler's NEON builtin definitions. */

/* vld2_lane_u64(__p0, __p1, __p2): copies __p1 into __s1 and passes __p0,
 * __s1.val[0..1] (cast to int8x8_t) and __p2 to __builtin_neon_vld2_lane_v
 * with selector 19; yields a uint64x1x2_t. */
#define vld2_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  uint64x1x2_t __ret; \
  uint64x1x2_t __s1 = __p1; \
  __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 19); \
  __ret; \
})
/* vld2_lane_f64: same shape for float64x1x2_t (selector 10). */
#define vld2_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  float64x1x2_t __ret; \
  float64x1x2_t __s1 = __p1; \
  __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 10); \
  __ret; \
})
/* vld2_lane_s64: same shape for int64x1x2_t (selector 3). */
#define vld2_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  int64x1x2_t __ret; \
  int64x1x2_t __s1 = __p1; \
  __builtin_neon_vld2_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 3); \
  __ret; \
})
/* vld3_p64(__p0): poly64x1x3_t filled by __builtin_neon_vld3_v (selector 6). */
#define vld3_p64(__p0) __extension__ ({ \
  poly64x1x3_t __ret; \
  __builtin_neon_vld3_v(&__ret, __p0, 6); \
  __ret; \
})
/* vld3q_p64(__p0): poly64x2x3_t filled by __builtin_neon_vld3q_v (selector
 * 38); this is the definition used when __LITTLE_ENDIAN__ is defined. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_p64(__p0) __extension__ ({ \
  poly64x2x3_t __ret; \
  __builtin_neon_vld3q_v(&__ret, __p0, 38); \
  __ret; \
})
#else
/* vld3q_p64(__p0), second definition of a conditional pair: a statement
 * expression in which __builtin_neon_vld3q_v fills a poly64x2x3_t through
 * &__ret (selector 38); val[0..2] are then each lane-swapped in place and
 * the struct is yielded.
 * NOTE(review): the last integer argument of each builtin call in this block
 * is presumably a vector-type selector -- confirm against the compiler's
 * NEON builtin definitions. */
#define vld3q_p64(__p0) __extension__ ({ \
  poly64x2x3_t __ret; \
  __builtin_neon_vld3q_v(&__ret, __p0, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3q_u64(__p0): uint64x2x3_t filled by __builtin_neon_vld3q_v (selector
 * 51). When __LITTLE_ENDIAN__ is not defined, val[0..2] are each
 * lane-swapped in place before the struct is yielded. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_u64(__p0) __extension__ ({ \
  uint64x2x3_t __ret; \
  __builtin_neon_vld3q_v(&__ret, __p0, 51); \
  __ret; \
})
#else
#define vld3q_u64(__p0) __extension__ ({ \
  uint64x2x3_t __ret; \
  __builtin_neon_vld3q_v(&__ret, __p0, 51); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3q_f64(__p0): same shape as vld3q_u64 for float64x2x3_t (selector 42). */
#ifdef __LITTLE_ENDIAN__
#define vld3q_f64(__p0) __extension__ ({ \
  float64x2x3_t __ret; \
  __builtin_neon_vld3q_v(&__ret, __p0, 42); \
  __ret; \
})
#else
#define vld3q_f64(__p0) __extension__ ({ \
  float64x2x3_t __ret; \
  __builtin_neon_vld3q_v(&__ret, __p0, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3q_s64(__p0): same shape as vld3q_u64 for int64x2x3_t (selector 35). */
#ifdef __LITTLE_ENDIAN__
#define vld3q_s64(__p0) __extension__ ({ \
  int64x2x3_t __ret; \
  __builtin_neon_vld3q_v(&__ret, __p0, 35); \
  __ret; \
})
#else
#define vld3q_s64(__p0) __extension__ ({ \
  int64x2x3_t __ret; \
  __builtin_neon_vld3q_v(&__ret, __p0, 35); \
 \
__ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* The macros below are GNU statement expressions whose value is __ret; in
 * each, the builtin writes its result through &__ret.
 * NOTE(review): the last integer argument of each __builtin_neon_* call is
 * presumably a vector-type selector -- confirm against the compiler's NEON
 * builtin definitions. */

/* vld3_f64(__p0): float64x1x3_t filled by __builtin_neon_vld3_v (selector
 * 10). */
#define vld3_f64(__p0) __extension__ ({ \
  float64x1x3_t __ret; \
  __builtin_neon_vld3_v(&__ret, __p0, 10); \
  __ret; \
})
/* vld3_dup_p64(__p0): poly64x1x3_t filled by __builtin_neon_vld3_dup_v
 * (selector 6). */
#define vld3_dup_p64(__p0) __extension__ ({ \
  poly64x1x3_t __ret; \
  __builtin_neon_vld3_dup_v(&__ret, __p0, 6); \
  __ret; \
})
/* vld3q_dup_p64(__p0): poly64x2x3_t filled by __builtin_neon_vld3q_dup_v
 * (selector 38). When __LITTLE_ENDIAN__ is not defined, val[0..2] are each
 * lane-swapped in place before the struct is yielded. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_dup_p64(__p0) __extension__ ({ \
  poly64x2x3_t __ret; \
  __builtin_neon_vld3q_dup_v(&__ret, __p0, 38); \
  __ret; \
})
#else
#define vld3q_dup_p64(__p0) __extension__ ({ \
  poly64x2x3_t __ret; \
  __builtin_neon_vld3q_dup_v(&__ret, __p0, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3q_dup_f64(__p0): same shape as vld3q_dup_p64 for float64x2x3_t
 * (selector 42). */
#ifdef __LITTLE_ENDIAN__
#define vld3q_dup_f64(__p0) __extension__ ({ \
  float64x2x3_t __ret; \
  __builtin_neon_vld3q_dup_v(&__ret, __p0, 42); \
  __ret; \
})
#else
#define vld3q_dup_f64(__p0) __extension__ ({ \
  float64x2x3_t __ret; \
  __builtin_neon_vld3q_dup_v(&__ret, __p0, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3_dup_f64(__p0): float64x1x3_t filled by __builtin_neon_vld3_dup_v
 * (selector 10). */
#define vld3_dup_f64(__p0) __extension__ ({ \
  float64x1x3_t __ret; \
  __builtin_neon_vld3_dup_v(&__ret, __p0, 10); \
__ret; \
})
/* The macros below are GNU statement expressions whose value is __ret. Each
 * copies __p1 into __s1 and passes __p0, the three val[] members (cast to a
 * byte-vector type) and __p2 to a __builtin_neon_vld3*_lane_v builtin, which
 * writes through &__ret.
 * NOTE(review): the last integer argument of the builtin is presumably a
 * vector-type selector, and __p2 presumably the lane index -- confirm
 * against the compiler's NEON builtin definitions. */

/* vld3_lane_p64(__p0, __p1, __p2): poly64x1x3_t, int8x8_t casts, selector 6. */
#define vld3_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  poly64x1x3_t __ret; \
  poly64x1x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 6); \
  __ret; \
})
/* vld3q_lane_p8(__p0, __p1, __p2): poly8x16x3_t, int8x16_t casts, selector
 * 36. When __LITTLE_ENDIAN__ is not defined, all 16 lanes of each input
 * vector are reversed into __rev1 before the call and all 16 lanes of each
 * result vector are reversed afterwards. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  poly8x16x3_t __ret; \
  poly8x16x3_t __s1 = __p1; \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 36); \
  __ret; \
})
#else
#define vld3q_lane_p8(__p0, __p1, __p2) __extension__ ({ \
  poly8x16x3_t __ret; \
  poly8x16x3_t __s1 = __p1; \
  poly8x16x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 36); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld3q_lane_p64(__p0, __p1, __p2): poly64x2x3_t, int8x16_t casts, selector
 * 38; the #else variant uses two-lane swaps instead of 16-lane reversals. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  poly64x2x3_t __ret; \
  poly64x2x3_t __s1 = __p1; \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0],
(int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 38); \
  __ret; \
})
#else
/* Non-__LITTLE_ENDIAN__ vld3q_lane_p64: lane-swaps each of the three input
 * vectors into __rev1, calls __builtin_neon_vld3q_lane_v on the swapped
 * copies (selector 38), then lane-swaps each of the three result vectors. */
#define vld3q_lane_p64(__p0, __p1, __p2) __extension__ ({ \
  poly64x2x3_t __ret; \
  poly64x2x3_t __s1 = __p1; \
  poly64x2x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3q_lane_u8(__p0, __p1, __p2): statement expression yielding a
 * uint8x16x3_t. Copies __p1 into __s1 and passes __p0, __s1.val[0..2] (cast
 * to int8x16_t) and __p2 to __builtin_neon_vld3q_lane_v with selector 48.
 * When __LITTLE_ENDIAN__ is not defined, all 16 lanes of each input vector
 * are reversed into __rev1 before the call and all 16 lanes of each result
 * vector are reversed afterwards.
 * NOTE(review): the final integer is presumably a vector-type selector and
 * __p2 the lane index -- confirm against the NEON builtin definitions. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  uint8x16x3_t __ret; \
  uint8x16x3_t __s1 = __p1; \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 48); \
  __ret; \
})
#else
#define vld3q_lane_u8(__p0, __p1, __p2) __extension__ ({ \
  uint8x16x3_t __ret; \
  uint8x16x3_t __s1 = __p1; \
  uint8x16x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 48); \
 \
  __ret.val[0] =
__builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld3q_lane_u64(__p0, __p1, __p2): statement expression yielding a
 * uint64x2x3_t. Copies __p1 into __s1 and passes __p0, __s1.val[0..2] (cast
 * to int8x16_t) and __p2 to __builtin_neon_vld3q_lane_v with selector 51.
 * When __LITTLE_ENDIAN__ is not defined, each input vector is lane-swapped
 * into __rev1 before the call and each result vector lane-swapped afterwards.
 * NOTE(review): the final integer is presumably a vector-type selector and
 * __p2 the lane index -- confirm against the NEON builtin definitions. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  uint64x2x3_t __ret; \
  uint64x2x3_t __s1 = __p1; \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 51); \
  __ret; \
})
#else
#define vld3q_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  uint64x2x3_t __ret; \
  uint64x2x3_t __s1 = __p1; \
  uint64x2x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 51); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3q_lane_s8(__p0, __p1, __p2): int8x16x3_t counterpart (selector 32);
 * its #else variant reverses all 16 lanes of inputs and results instead of
 * swapping two. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  int8x16x3_t __ret; \
  int8x16x3_t __s1 = __p1; \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 32); \
  __ret; \
})
#else
#define vld3q_lane_s8(__p0, __p1, __p2) __extension__ ({ \
  int8x16x3_t __ret; \
int8x16x3_t __s1 = __p1; \
  int8x16x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 32); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \
  __ret; \
})
#endif

/* vld3q_lane_f64(__p0, __p1, __p2): statement expression yielding a
 * float64x2x3_t. Copies __p1 into __s1 and passes __p0, __s1.val[0..2] (cast
 * to int8x16_t) and __p2 to __builtin_neon_vld3q_lane_v with selector 42.
 * When __LITTLE_ENDIAN__ is not defined, each input vector is lane-swapped
 * into __rev1 before the call and each result vector lane-swapped afterwards.
 * NOTE(review): the final integer is presumably a vector-type selector and
 * __p2 the lane index -- confirm against the NEON builtin definitions. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  float64x2x3_t __ret; \
  float64x2x3_t __s1 = __p1; \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 42); \
  __ret; \
})
#else
#define vld3q_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  float64x2x3_t __ret; \
  float64x2x3_t __s1 = __p1; \
  float64x2x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 42); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
__ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* The macros below are GNU statement expressions whose value is __ret. Each
 * copies __p1 into __s1 and passes __p0, __s1.val[0..2] (cast to a
 * byte-vector type) and __p2 to a __builtin_neon_vld3*_lane_v builtin, which
 * writes through &__ret.
 * NOTE(review): the last integer argument of the builtin is presumably a
 * vector-type selector, and __p2 presumably the lane index -- confirm
 * against the compiler's NEON builtin definitions. */

/* vld3q_lane_s64(__p0, __p1, __p2): int64x2x3_t, int8x16_t casts, selector
 * 35. When __LITTLE_ENDIAN__ is not defined, each input vector is
 * lane-swapped into __rev1 before the call and each result vector
 * lane-swapped afterwards. */
#ifdef __LITTLE_ENDIAN__
#define vld3q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  int64x2x3_t __ret; \
  int64x2x3_t __s1 = __p1; \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 35); \
  __ret; \
})
#else
#define vld3q_lane_s64(__p0, __p1, __p2) __extension__ ({ \
  int64x2x3_t __ret; \
  int64x2x3_t __s1 = __p1; \
  int64x2x3_t __rev1; \
  __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \
  __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \
  __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \
  __builtin_neon_vld3q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 35); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret; \
})
#endif

/* vld3_lane_u64(__p0, __p1, __p2): uint64x1x3_t, int8x8_t casts, selector 19. */
#define vld3_lane_u64(__p0, __p1, __p2) __extension__ ({ \
  uint64x1x3_t __ret; \
  uint64x1x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 19); \
  __ret; \
})
/* vld3_lane_f64(__p0, __p1, __p2): float64x1x3_t, int8x8_t casts, selector 10. */
#define vld3_lane_f64(__p0, __p1, __p2) __extension__ ({ \
  float64x1x3_t __ret; \
  float64x1x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 10); \
  __ret; \
})
/* vld3_lane_s64(__p0, __p1, __p2): int64x1x3_t, int8x8_t casts, selector 3. */
#define vld3_lane_s64(__p0, __p1, __p2) __extension__ ({ \
int64x1x3_t __ret; \
  int64x1x3_t __s1 = __p1; \
  __builtin_neon_vld3_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 3); \
  __ret; \
})
/* The macros below are GNU statement expressions whose value is __ret; in
 * each, __builtin_neon_vld4_v / __builtin_neon_vld4q_v writes its result
 * through &__ret.
 * NOTE(review): the last integer argument of each builtin call is presumably
 * a vector-type selector -- confirm against the compiler's NEON builtin
 * definitions. */

/* vld4_p64(__p0): poly64x1x4_t filled by __builtin_neon_vld4_v (selector 6). */
#define vld4_p64(__p0) __extension__ ({ \
  poly64x1x4_t __ret; \
  __builtin_neon_vld4_v(&__ret, __p0, 6); \
  __ret; \
})
/* vld4q_p64(__p0): poly64x2x4_t filled by __builtin_neon_vld4q_v (selector
 * 38). When __LITTLE_ENDIAN__ is not defined, val[0..3] are each
 * lane-swapped in place before the struct is yielded. */
#ifdef __LITTLE_ENDIAN__
#define vld4q_p64(__p0) __extension__ ({ \
  poly64x2x4_t __ret; \
  __builtin_neon_vld4q_v(&__ret, __p0, 38); \
  __ret; \
})
#else
#define vld4q_p64(__p0) __extension__ ({ \
  poly64x2x4_t __ret; \
  __builtin_neon_vld4q_v(&__ret, __p0, 38); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  __ret; \
})
#endif

/* vld4q_u64(__p0): same shape as vld4q_p64 for uint64x2x4_t (selector 51). */
#ifdef __LITTLE_ENDIAN__
#define vld4q_u64(__p0) __extension__ ({ \
  uint64x2x4_t __ret; \
  __builtin_neon_vld4q_v(&__ret, __p0, 51); \
  __ret; \
})
#else
#define vld4q_u64(__p0) __extension__ ({ \
  uint64x2x4_t __ret; \
  __builtin_neon_vld4q_v(&__ret, __p0, 51); \
 \
  __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \
  __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \
  __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \
  __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \
  __ret; \
})
#endif

/* vld4q_f64(__p0): same shape as vld4q_p64 for float64x2x4_t (selector 42). */
#ifdef __LITTLE_ENDIAN__
#define vld4q_f64(__p0) __extension__ ({ \
  float64x2x4_t __ret; \
  __builtin_neon_vld4q_v(&__ret, __p0, 42); \
  __ret; \
})
#else
#define vld4q_f64(__p0) __extension__ ({ \
52036 float64x2x4_t __ret; \ 52037 __builtin_neon_vld4q_v(&__ret, __p0, 42); \ 52038 \ 52039 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 52040 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 52041 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 52042 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 52043 __ret; \ 52044 }) 52045 #endif 52046 52047 #ifdef __LITTLE_ENDIAN__ 52048 #define vld4q_s64(__p0) __extension__ ({ \ 52049 int64x2x4_t __ret; \ 52050 __builtin_neon_vld4q_v(&__ret, __p0, 35); \ 52051 __ret; \ 52052 }) 52053 #else 52054 #define vld4q_s64(__p0) __extension__ ({ \ 52055 int64x2x4_t __ret; \ 52056 __builtin_neon_vld4q_v(&__ret, __p0, 35); \ 52057 \ 52058 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 52059 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 52060 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 52061 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 52062 __ret; \ 52063 }) 52064 #endif 52065 52066 #define vld4_f64(__p0) __extension__ ({ \ 52067 float64x1x4_t __ret; \ 52068 __builtin_neon_vld4_v(&__ret, __p0, 10); \ 52069 __ret; \ 52070 }) 52071 #define vld4_dup_p64(__p0) __extension__ ({ \ 52072 poly64x1x4_t __ret; \ 52073 __builtin_neon_vld4_dup_v(&__ret, __p0, 6); \ 52074 __ret; \ 52075 }) 52076 #ifdef __LITTLE_ENDIAN__ 52077 #define vld4q_dup_p64(__p0) __extension__ ({ \ 52078 poly64x2x4_t __ret; \ 52079 __builtin_neon_vld4q_dup_v(&__ret, __p0, 38); \ 52080 __ret; \ 52081 }) 52082 #else 52083 #define vld4q_dup_p64(__p0) __extension__ ({ \ 52084 poly64x2x4_t __ret; \ 52085 __builtin_neon_vld4q_dup_v(&__ret, __p0, 38); \ 52086 \ 52087 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 52088 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 52089 __ret.val[2] = 
__builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 52090 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 52091 __ret; \ 52092 }) 52093 #endif 52094 52095 #ifdef __LITTLE_ENDIAN__ 52096 #define vld4q_dup_f64(__p0) __extension__ ({ \ 52097 float64x2x4_t __ret; \ 52098 __builtin_neon_vld4q_dup_v(&__ret, __p0, 42); \ 52099 __ret; \ 52100 }) 52101 #else 52102 #define vld4q_dup_f64(__p0) __extension__ ({ \ 52103 float64x2x4_t __ret; \ 52104 __builtin_neon_vld4q_dup_v(&__ret, __p0, 42); \ 52105 \ 52106 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 52107 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 52108 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 52109 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 52110 __ret; \ 52111 }) 52112 #endif 52113 52114 #define vld4_dup_f64(__p0) __extension__ ({ \ 52115 float64x1x4_t __ret; \ 52116 __builtin_neon_vld4_dup_v(&__ret, __p0, 10); \ 52117 __ret; \ 52118 }) 52119 #define vld4_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 52120 poly64x1x4_t __ret; \ 52121 poly64x1x4_t __s1 = __p1; \ 52122 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 6); \ 52123 __ret; \ 52124 }) 52125 #ifdef __LITTLE_ENDIAN__ 52126 #define vld4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 52127 poly8x16x4_t __ret; \ 52128 poly8x16x4_t __s1 = __p1; \ 52129 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 36); \ 52130 __ret; \ 52131 }) 52132 #else 52133 #define vld4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 52134 poly8x16x4_t __ret; \ 52135 poly8x16x4_t __s1 = __p1; \ 52136 poly8x16x4_t __rev1; \ 52137 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 
52138 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52139 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52140 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52141 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 36); \ 52142 \ 52143 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52144 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52145 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52146 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52147 __ret; \ 52148 }) 52149 #endif 52150 52151 #ifdef __LITTLE_ENDIAN__ 52152 #define vld4q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 52153 poly64x2x4_t __ret; \ 52154 poly64x2x4_t __s1 = __p1; \ 52155 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 38); \ 52156 __ret; \ 52157 }) 52158 #else 52159 #define vld4q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 52160 poly64x2x4_t __ret; \ 52161 poly64x2x4_t __s1 = __p1; \ 52162 poly64x2x4_t __rev1; \ 52163 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 52164 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 52165 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 52166 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 52167 __builtin_neon_vld4q_lane_v(&__ret, 
__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 38); \ 52168 \ 52169 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 52170 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 52171 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 52172 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 52173 __ret; \ 52174 }) 52175 #endif 52176 52177 #ifdef __LITTLE_ENDIAN__ 52178 #define vld4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 52179 uint8x16x4_t __ret; \ 52180 uint8x16x4_t __s1 = __p1; \ 52181 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 48); \ 52182 __ret; \ 52183 }) 52184 #else 52185 #define vld4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 52186 uint8x16x4_t __ret; \ 52187 uint8x16x4_t __s1 = __p1; \ 52188 uint8x16x4_t __rev1; \ 52189 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52190 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52191 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52192 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52193 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 48); \ 52194 \ 52195 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52196 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52197 __ret.val[2] = 
__builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52198 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52199 __ret; \ 52200 }) 52201 #endif 52202 52203 #ifdef __LITTLE_ENDIAN__ 52204 #define vld4q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 52205 uint64x2x4_t __ret; \ 52206 uint64x2x4_t __s1 = __p1; \ 52207 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 51); \ 52208 __ret; \ 52209 }) 52210 #else 52211 #define vld4q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 52212 uint64x2x4_t __ret; \ 52213 uint64x2x4_t __s1 = __p1; \ 52214 uint64x2x4_t __rev1; \ 52215 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 52216 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 52217 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 52218 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 52219 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 51); \ 52220 \ 52221 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 52222 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 52223 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 52224 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 52225 __ret; \ 52226 }) 52227 #endif 52228 52229 #ifdef __LITTLE_ENDIAN__ 52230 #define vld4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 52231 int8x16x4_t __ret; \ 52232 int8x16x4_t __s1 = __p1; \ 52233 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 32); \ 52234 __ret; \ 52235 }) 
52236 #else 52237 #define vld4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 52238 int8x16x4_t __ret; \ 52239 int8x16x4_t __s1 = __p1; \ 52240 int8x16x4_t __rev1; \ 52241 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52242 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52243 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52244 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52245 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 32); \ 52246 \ 52247 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52248 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52249 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52250 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 52251 __ret; \ 52252 }) 52253 #endif 52254 52255 #ifdef __LITTLE_ENDIAN__ 52256 #define vld4q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 52257 float64x2x4_t __ret; \ 52258 float64x2x4_t __s1 = __p1; \ 52259 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 42); \ 52260 __ret; \ 52261 }) 52262 #else 52263 #define vld4q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 52264 float64x2x4_t __ret; \ 52265 float64x2x4_t __s1 = __p1; \ 52266 float64x2x4_t __rev1; \ 52267 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], 
__s1.val[0], 1, 0); \ 52268 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 52269 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 52270 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 52271 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 42); \ 52272 \ 52273 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 52274 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 52275 __ret.val[2] = __builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 52276 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 52277 __ret; \ 52278 }) 52279 #endif 52280 52281 #ifdef __LITTLE_ENDIAN__ 52282 #define vld4q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 52283 int64x2x4_t __ret; \ 52284 int64x2x4_t __s1 = __p1; \ 52285 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 35); \ 52286 __ret; \ 52287 }) 52288 #else 52289 #define vld4q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 52290 int64x2x4_t __ret; \ 52291 int64x2x4_t __s1 = __p1; \ 52292 int64x2x4_t __rev1; \ 52293 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 52294 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 52295 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 52296 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 52297 __builtin_neon_vld4q_lane_v(&__ret, __p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 35); \ 52298 \ 52299 __ret.val[0] = __builtin_shufflevector(__ret.val[0], __ret.val[0], 1, 0); \ 52300 __ret.val[1] = __builtin_shufflevector(__ret.val[1], __ret.val[1], 1, 0); \ 52301 __ret.val[2] = 
__builtin_shufflevector(__ret.val[2], __ret.val[2], 1, 0); \ 52302 __ret.val[3] = __builtin_shufflevector(__ret.val[3], __ret.val[3], 1, 0); \ 52303 __ret; \ 52304 }) 52305 #endif 52306 52307 #define vld4_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 52308 uint64x1x4_t __ret; \ 52309 uint64x1x4_t __s1 = __p1; \ 52310 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 19); \ 52311 __ret; \ 52312 }) 52313 #define vld4_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 52314 float64x1x4_t __ret; \ 52315 float64x1x4_t __s1 = __p1; \ 52316 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 10); \ 52317 __ret; \ 52318 }) 52319 #define vld4_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 52320 int64x1x4_t __ret; \ 52321 int64x1x4_t __s1 = __p1; \ 52322 __builtin_neon_vld4_lane_v(&__ret, __p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 3); \ 52323 __ret; \ 52324 }) 52325 #define vldrq_p128(__p0) __extension__ ({ \ 52326 poly128_t __ret; \ 52327 __ret = (poly128_t) __builtin_neon_vldrq_p128(__p0); \ 52328 __ret; \ 52329 }) 52330 #ifdef __LITTLE_ENDIAN__ 52331 __ai __attribute__((target("neon"))) float64x2_t vmaxq_f64(float64x2_t __p0, float64x2_t __p1) { 52332 float64x2_t __ret; 52333 __ret = (float64x2_t) __builtin_neon_vmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 52334 return __ret; 52335 } 52336 #else 52337 __ai __attribute__((target("neon"))) float64x2_t vmaxq_f64(float64x2_t __p0, float64x2_t __p1) { 52338 float64x2_t __ret; 52339 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52340 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 52341 __ret = (float64x2_t) __builtin_neon_vmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 52342 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 52343 return __ret; 
52344 } 52345 #endif 52346 52347 __ai __attribute__((target("neon"))) float64x1_t vmax_f64(float64x1_t __p0, float64x1_t __p1) { 52348 float64x1_t __ret; 52349 __ret = (float64x1_t) __builtin_neon_vmax_v((int8x8_t)__p0, (int8x8_t)__p1, 10); 52350 return __ret; 52351 } 52352 #ifdef __LITTLE_ENDIAN__ 52353 __ai __attribute__((target("neon"))) float64_t vmaxnmvq_f64(float64x2_t __p0) { 52354 float64_t __ret; 52355 __ret = (float64_t) __builtin_neon_vmaxnmvq_f64(__p0); 52356 return __ret; 52357 } 52358 #else 52359 __ai __attribute__((target("neon"))) float64_t vmaxnmvq_f64(float64x2_t __p0) { 52360 float64_t __ret; 52361 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52362 __ret = (float64_t) __builtin_neon_vmaxnmvq_f64(__rev0); 52363 return __ret; 52364 } 52365 #endif 52366 52367 #ifdef __LITTLE_ENDIAN__ 52368 __ai __attribute__((target("neon"))) float32_t vmaxnmvq_f32(float32x4_t __p0) { 52369 float32_t __ret; 52370 __ret = (float32_t) __builtin_neon_vmaxnmvq_f32(__p0); 52371 return __ret; 52372 } 52373 #else 52374 __ai __attribute__((target("neon"))) float32_t vmaxnmvq_f32(float32x4_t __p0) { 52375 float32_t __ret; 52376 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52377 __ret = (float32_t) __builtin_neon_vmaxnmvq_f32(__rev0); 52378 return __ret; 52379 } 52380 #endif 52381 52382 #ifdef __LITTLE_ENDIAN__ 52383 __ai __attribute__((target("neon"))) float32_t vmaxnmv_f32(float32x2_t __p0) { 52384 float32_t __ret; 52385 __ret = (float32_t) __builtin_neon_vmaxnmv_f32(__p0); 52386 return __ret; 52387 } 52388 #else 52389 __ai __attribute__((target("neon"))) float32_t vmaxnmv_f32(float32x2_t __p0) { 52390 float32_t __ret; 52391 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52392 __ret = (float32_t) __builtin_neon_vmaxnmv_f32(__rev0); 52393 return __ret; 52394 } 52395 #endif 52396 52397 #ifdef __LITTLE_ENDIAN__ 52398 __ai __attribute__((target("neon"))) uint8_t vmaxvq_u8(uint8x16_t __p0) { 
52399 uint8_t __ret; 52400 __ret = (uint8_t) __builtin_neon_vmaxvq_u8(__p0); 52401 return __ret; 52402 } 52403 #else 52404 __ai __attribute__((target("neon"))) uint8_t vmaxvq_u8(uint8x16_t __p0) { 52405 uint8_t __ret; 52406 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 52407 __ret = (uint8_t) __builtin_neon_vmaxvq_u8(__rev0); 52408 return __ret; 52409 } 52410 #endif 52411 52412 #ifdef __LITTLE_ENDIAN__ 52413 __ai __attribute__((target("neon"))) uint32_t vmaxvq_u32(uint32x4_t __p0) { 52414 uint32_t __ret; 52415 __ret = (uint32_t) __builtin_neon_vmaxvq_u32(__p0); 52416 return __ret; 52417 } 52418 #else 52419 __ai __attribute__((target("neon"))) uint32_t vmaxvq_u32(uint32x4_t __p0) { 52420 uint32_t __ret; 52421 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52422 __ret = (uint32_t) __builtin_neon_vmaxvq_u32(__rev0); 52423 return __ret; 52424 } 52425 #endif 52426 52427 #ifdef __LITTLE_ENDIAN__ 52428 __ai __attribute__((target("neon"))) uint16_t vmaxvq_u16(uint16x8_t __p0) { 52429 uint16_t __ret; 52430 __ret = (uint16_t) __builtin_neon_vmaxvq_u16(__p0); 52431 return __ret; 52432 } 52433 #else 52434 __ai __attribute__((target("neon"))) uint16_t vmaxvq_u16(uint16x8_t __p0) { 52435 uint16_t __ret; 52436 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 52437 __ret = (uint16_t) __builtin_neon_vmaxvq_u16(__rev0); 52438 return __ret; 52439 } 52440 #endif 52441 52442 #ifdef __LITTLE_ENDIAN__ 52443 __ai __attribute__((target("neon"))) int8_t vmaxvq_s8(int8x16_t __p0) { 52444 int8_t __ret; 52445 __ret = (int8_t) __builtin_neon_vmaxvq_s8(__p0); 52446 return __ret; 52447 } 52448 #else 52449 __ai __attribute__((target("neon"))) int8_t vmaxvq_s8(int8x16_t __p0) { 52450 int8_t __ret; 52451 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 52452 __ret = (int8_t) 
__builtin_neon_vmaxvq_s8(__rev0); 52453 return __ret; 52454 } 52455 #endif 52456 52457 #ifdef __LITTLE_ENDIAN__ 52458 __ai __attribute__((target("neon"))) float64_t vmaxvq_f64(float64x2_t __p0) { 52459 float64_t __ret; 52460 __ret = (float64_t) __builtin_neon_vmaxvq_f64(__p0); 52461 return __ret; 52462 } 52463 #else 52464 __ai __attribute__((target("neon"))) float64_t vmaxvq_f64(float64x2_t __p0) { 52465 float64_t __ret; 52466 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52467 __ret = (float64_t) __builtin_neon_vmaxvq_f64(__rev0); 52468 return __ret; 52469 } 52470 #endif 52471 52472 #ifdef __LITTLE_ENDIAN__ 52473 __ai __attribute__((target("neon"))) float32_t vmaxvq_f32(float32x4_t __p0) { 52474 float32_t __ret; 52475 __ret = (float32_t) __builtin_neon_vmaxvq_f32(__p0); 52476 return __ret; 52477 } 52478 #else 52479 __ai __attribute__((target("neon"))) float32_t vmaxvq_f32(float32x4_t __p0) { 52480 float32_t __ret; 52481 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52482 __ret = (float32_t) __builtin_neon_vmaxvq_f32(__rev0); 52483 return __ret; 52484 } 52485 #endif 52486 52487 #ifdef __LITTLE_ENDIAN__ 52488 __ai __attribute__((target("neon"))) int32_t vmaxvq_s32(int32x4_t __p0) { 52489 int32_t __ret; 52490 __ret = (int32_t) __builtin_neon_vmaxvq_s32(__p0); 52491 return __ret; 52492 } 52493 #else 52494 __ai __attribute__((target("neon"))) int32_t vmaxvq_s32(int32x4_t __p0) { 52495 int32_t __ret; 52496 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52497 __ret = (int32_t) __builtin_neon_vmaxvq_s32(__rev0); 52498 return __ret; 52499 } 52500 #endif 52501 52502 #ifdef __LITTLE_ENDIAN__ 52503 __ai __attribute__((target("neon"))) int16_t vmaxvq_s16(int16x8_t __p0) { 52504 int16_t __ret; 52505 __ret = (int16_t) __builtin_neon_vmaxvq_s16(__p0); 52506 return __ret; 52507 } 52508 #else 52509 __ai __attribute__((target("neon"))) int16_t vmaxvq_s16(int16x8_t __p0) { 52510 int16_t __ret; 
52511 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 52512 __ret = (int16_t) __builtin_neon_vmaxvq_s16(__rev0); 52513 return __ret; 52514 } 52515 #endif 52516 52517 #ifdef __LITTLE_ENDIAN__ 52518 __ai __attribute__((target("neon"))) uint8_t vmaxv_u8(uint8x8_t __p0) { 52519 uint8_t __ret; 52520 __ret = (uint8_t) __builtin_neon_vmaxv_u8(__p0); 52521 return __ret; 52522 } 52523 #else 52524 __ai __attribute__((target("neon"))) uint8_t vmaxv_u8(uint8x8_t __p0) { 52525 uint8_t __ret; 52526 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 52527 __ret = (uint8_t) __builtin_neon_vmaxv_u8(__rev0); 52528 return __ret; 52529 } 52530 #endif 52531 52532 #ifdef __LITTLE_ENDIAN__ 52533 __ai __attribute__((target("neon"))) uint32_t vmaxv_u32(uint32x2_t __p0) { 52534 uint32_t __ret; 52535 __ret = (uint32_t) __builtin_neon_vmaxv_u32(__p0); 52536 return __ret; 52537 } 52538 #else 52539 __ai __attribute__((target("neon"))) uint32_t vmaxv_u32(uint32x2_t __p0) { 52540 uint32_t __ret; 52541 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52542 __ret = (uint32_t) __builtin_neon_vmaxv_u32(__rev0); 52543 return __ret; 52544 } 52545 #endif 52546 52547 #ifdef __LITTLE_ENDIAN__ 52548 __ai __attribute__((target("neon"))) uint16_t vmaxv_u16(uint16x4_t __p0) { 52549 uint16_t __ret; 52550 __ret = (uint16_t) __builtin_neon_vmaxv_u16(__p0); 52551 return __ret; 52552 } 52553 #else 52554 __ai __attribute__((target("neon"))) uint16_t vmaxv_u16(uint16x4_t __p0) { 52555 uint16_t __ret; 52556 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52557 __ret = (uint16_t) __builtin_neon_vmaxv_u16(__rev0); 52558 return __ret; 52559 } 52560 #endif 52561 52562 #ifdef __LITTLE_ENDIAN__ 52563 __ai __attribute__((target("neon"))) int8_t vmaxv_s8(int8x8_t __p0) { 52564 int8_t __ret; 52565 __ret = (int8_t) __builtin_neon_vmaxv_s8(__p0); 52566 return __ret; 52567 } 52568 #else 52569 __ai 
__attribute__((target("neon"))) int8_t vmaxv_s8(int8x8_t __p0) { 52570 int8_t __ret; 52571 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 52572 __ret = (int8_t) __builtin_neon_vmaxv_s8(__rev0); 52573 return __ret; 52574 } 52575 #endif 52576 52577 #ifdef __LITTLE_ENDIAN__ 52578 __ai __attribute__((target("neon"))) float32_t vmaxv_f32(float32x2_t __p0) { 52579 float32_t __ret; 52580 __ret = (float32_t) __builtin_neon_vmaxv_f32(__p0); 52581 return __ret; 52582 } 52583 #else 52584 __ai __attribute__((target("neon"))) float32_t vmaxv_f32(float32x2_t __p0) { 52585 float32_t __ret; 52586 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52587 __ret = (float32_t) __builtin_neon_vmaxv_f32(__rev0); 52588 return __ret; 52589 } 52590 #endif 52591 52592 #ifdef __LITTLE_ENDIAN__ 52593 __ai __attribute__((target("neon"))) int32_t vmaxv_s32(int32x2_t __p0) { 52594 int32_t __ret; 52595 __ret = (int32_t) __builtin_neon_vmaxv_s32(__p0); 52596 return __ret; 52597 } 52598 #else 52599 __ai __attribute__((target("neon"))) int32_t vmaxv_s32(int32x2_t __p0) { 52600 int32_t __ret; 52601 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52602 __ret = (int32_t) __builtin_neon_vmaxv_s32(__rev0); 52603 return __ret; 52604 } 52605 #endif 52606 52607 #ifdef __LITTLE_ENDIAN__ 52608 __ai __attribute__((target("neon"))) int16_t vmaxv_s16(int16x4_t __p0) { 52609 int16_t __ret; 52610 __ret = (int16_t) __builtin_neon_vmaxv_s16(__p0); 52611 return __ret; 52612 } 52613 #else 52614 __ai __attribute__((target("neon"))) int16_t vmaxv_s16(int16x4_t __p0) { 52615 int16_t __ret; 52616 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52617 __ret = (int16_t) __builtin_neon_vmaxv_s16(__rev0); 52618 return __ret; 52619 } 52620 #endif 52621 52622 #ifdef __LITTLE_ENDIAN__ 52623 __ai __attribute__((target("neon"))) float64x2_t vminq_f64(float64x2_t __p0, float64x2_t __p1) { 52624 float64x2_t __ret; 52625 __ret 
= (float64x2_t) __builtin_neon_vminq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 52626 return __ret; 52627 } 52628 #else 52629 __ai __attribute__((target("neon"))) float64x2_t vminq_f64(float64x2_t __p0, float64x2_t __p1) { 52630 float64x2_t __ret; 52631 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52632 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 52633 __ret = (float64x2_t) __builtin_neon_vminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 52634 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 52635 return __ret; 52636 } 52637 #endif 52638 52639 __ai __attribute__((target("neon"))) float64x1_t vmin_f64(float64x1_t __p0, float64x1_t __p1) { 52640 float64x1_t __ret; 52641 __ret = (float64x1_t) __builtin_neon_vmin_v((int8x8_t)__p0, (int8x8_t)__p1, 10); 52642 return __ret; 52643 } 52644 #ifdef __LITTLE_ENDIAN__ 52645 __ai __attribute__((target("neon"))) float64_t vminnmvq_f64(float64x2_t __p0) { 52646 float64_t __ret; 52647 __ret = (float64_t) __builtin_neon_vminnmvq_f64(__p0); 52648 return __ret; 52649 } 52650 #else 52651 __ai __attribute__((target("neon"))) float64_t vminnmvq_f64(float64x2_t __p0) { 52652 float64_t __ret; 52653 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52654 __ret = (float64_t) __builtin_neon_vminnmvq_f64(__rev0); 52655 return __ret; 52656 } 52657 #endif 52658 52659 #ifdef __LITTLE_ENDIAN__ 52660 __ai __attribute__((target("neon"))) float32_t vminnmvq_f32(float32x4_t __p0) { 52661 float32_t __ret; 52662 __ret = (float32_t) __builtin_neon_vminnmvq_f32(__p0); 52663 return __ret; 52664 } 52665 #else 52666 __ai __attribute__((target("neon"))) float32_t vminnmvq_f32(float32x4_t __p0) { 52667 float32_t __ret; 52668 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52669 __ret = (float32_t) __builtin_neon_vminnmvq_f32(__rev0); 52670 return __ret; 52671 } 52672 #endif 52673 52674 #ifdef __LITTLE_ENDIAN__ 52675 __ai __attribute__((target("neon"))) 
float32_t vminnmv_f32(float32x2_t __p0) { 52676 float32_t __ret; 52677 __ret = (float32_t) __builtin_neon_vminnmv_f32(__p0); 52678 return __ret; 52679 } 52680 #else 52681 __ai __attribute__((target("neon"))) float32_t vminnmv_f32(float32x2_t __p0) { 52682 float32_t __ret; 52683 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52684 __ret = (float32_t) __builtin_neon_vminnmv_f32(__rev0); 52685 return __ret; 52686 } 52687 #endif 52688 52689 #ifdef __LITTLE_ENDIAN__ 52690 __ai __attribute__((target("neon"))) uint8_t vminvq_u8(uint8x16_t __p0) { 52691 uint8_t __ret; 52692 __ret = (uint8_t) __builtin_neon_vminvq_u8(__p0); 52693 return __ret; 52694 } 52695 #else 52696 __ai __attribute__((target("neon"))) uint8_t vminvq_u8(uint8x16_t __p0) { 52697 uint8_t __ret; 52698 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 52699 __ret = (uint8_t) __builtin_neon_vminvq_u8(__rev0); 52700 return __ret; 52701 } 52702 #endif 52703 52704 #ifdef __LITTLE_ENDIAN__ 52705 __ai __attribute__((target("neon"))) uint32_t vminvq_u32(uint32x4_t __p0) { 52706 uint32_t __ret; 52707 __ret = (uint32_t) __builtin_neon_vminvq_u32(__p0); 52708 return __ret; 52709 } 52710 #else 52711 __ai __attribute__((target("neon"))) uint32_t vminvq_u32(uint32x4_t __p0) { 52712 uint32_t __ret; 52713 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52714 __ret = (uint32_t) __builtin_neon_vminvq_u32(__rev0); 52715 return __ret; 52716 } 52717 #endif 52718 52719 #ifdef __LITTLE_ENDIAN__ 52720 __ai __attribute__((target("neon"))) uint16_t vminvq_u16(uint16x8_t __p0) { 52721 uint16_t __ret; 52722 __ret = (uint16_t) __builtin_neon_vminvq_u16(__p0); 52723 return __ret; 52724 } 52725 #else 52726 __ai __attribute__((target("neon"))) uint16_t vminvq_u16(uint16x8_t __p0) { 52727 uint16_t __ret; 52728 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 52729 __ret = 
(uint16_t) __builtin_neon_vminvq_u16(__rev0); 52730 return __ret; 52731 } 52732 #endif 52733 52734 #ifdef __LITTLE_ENDIAN__ 52735 __ai __attribute__((target("neon"))) int8_t vminvq_s8(int8x16_t __p0) { 52736 int8_t __ret; 52737 __ret = (int8_t) __builtin_neon_vminvq_s8(__p0); 52738 return __ret; 52739 } 52740 #else 52741 __ai __attribute__((target("neon"))) int8_t vminvq_s8(int8x16_t __p0) { 52742 int8_t __ret; 52743 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 52744 __ret = (int8_t) __builtin_neon_vminvq_s8(__rev0); 52745 return __ret; 52746 } 52747 #endif 52748 52749 #ifdef __LITTLE_ENDIAN__ 52750 __ai __attribute__((target("neon"))) float64_t vminvq_f64(float64x2_t __p0) { 52751 float64_t __ret; 52752 __ret = (float64_t) __builtin_neon_vminvq_f64(__p0); 52753 return __ret; 52754 } 52755 #else 52756 __ai __attribute__((target("neon"))) float64_t vminvq_f64(float64x2_t __p0) { 52757 float64_t __ret; 52758 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52759 __ret = (float64_t) __builtin_neon_vminvq_f64(__rev0); 52760 return __ret; 52761 } 52762 #endif 52763 52764 #ifdef __LITTLE_ENDIAN__ 52765 __ai __attribute__((target("neon"))) float32_t vminvq_f32(float32x4_t __p0) { 52766 float32_t __ret; 52767 __ret = (float32_t) __builtin_neon_vminvq_f32(__p0); 52768 return __ret; 52769 } 52770 #else 52771 __ai __attribute__((target("neon"))) float32_t vminvq_f32(float32x4_t __p0) { 52772 float32_t __ret; 52773 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52774 __ret = (float32_t) __builtin_neon_vminvq_f32(__rev0); 52775 return __ret; 52776 } 52777 #endif 52778 52779 #ifdef __LITTLE_ENDIAN__ 52780 __ai __attribute__((target("neon"))) int32_t vminvq_s32(int32x4_t __p0) { 52781 int32_t __ret; 52782 __ret = (int32_t) __builtin_neon_vminvq_s32(__p0); 52783 return __ret; 52784 } 52785 #else 52786 __ai __attribute__((target("neon"))) int32_t 
vminvq_s32(int32x4_t __p0) { 52787 int32_t __ret; 52788 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52789 __ret = (int32_t) __builtin_neon_vminvq_s32(__rev0); 52790 return __ret; 52791 } 52792 #endif 52793 52794 #ifdef __LITTLE_ENDIAN__ 52795 __ai __attribute__((target("neon"))) int16_t vminvq_s16(int16x8_t __p0) { 52796 int16_t __ret; 52797 __ret = (int16_t) __builtin_neon_vminvq_s16(__p0); 52798 return __ret; 52799 } 52800 #else 52801 __ai __attribute__((target("neon"))) int16_t vminvq_s16(int16x8_t __p0) { 52802 int16_t __ret; 52803 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 52804 __ret = (int16_t) __builtin_neon_vminvq_s16(__rev0); 52805 return __ret; 52806 } 52807 #endif 52808 52809 #ifdef __LITTLE_ENDIAN__ 52810 __ai __attribute__((target("neon"))) uint8_t vminv_u8(uint8x8_t __p0) { 52811 uint8_t __ret; 52812 __ret = (uint8_t) __builtin_neon_vminv_u8(__p0); 52813 return __ret; 52814 } 52815 #else 52816 __ai __attribute__((target("neon"))) uint8_t vminv_u8(uint8x8_t __p0) { 52817 uint8_t __ret; 52818 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 52819 __ret = (uint8_t) __builtin_neon_vminv_u8(__rev0); 52820 return __ret; 52821 } 52822 #endif 52823 52824 #ifdef __LITTLE_ENDIAN__ 52825 __ai __attribute__((target("neon"))) uint32_t vminv_u32(uint32x2_t __p0) { 52826 uint32_t __ret; 52827 __ret = (uint32_t) __builtin_neon_vminv_u32(__p0); 52828 return __ret; 52829 } 52830 #else 52831 __ai __attribute__((target("neon"))) uint32_t vminv_u32(uint32x2_t __p0) { 52832 uint32_t __ret; 52833 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52834 __ret = (uint32_t) __builtin_neon_vminv_u32(__rev0); 52835 return __ret; 52836 } 52837 #endif 52838 52839 #ifdef __LITTLE_ENDIAN__ 52840 __ai __attribute__((target("neon"))) uint16_t vminv_u16(uint16x4_t __p0) { 52841 uint16_t __ret; 52842 __ret = (uint16_t) __builtin_neon_vminv_u16(__p0); 
52843 return __ret; 52844 } 52845 #else 52846 __ai __attribute__((target("neon"))) uint16_t vminv_u16(uint16x4_t __p0) { 52847 uint16_t __ret; 52848 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52849 __ret = (uint16_t) __builtin_neon_vminv_u16(__rev0); 52850 return __ret; 52851 } 52852 #endif 52853 52854 #ifdef __LITTLE_ENDIAN__ 52855 __ai __attribute__((target("neon"))) int8_t vminv_s8(int8x8_t __p0) { 52856 int8_t __ret; 52857 __ret = (int8_t) __builtin_neon_vminv_s8(__p0); 52858 return __ret; 52859 } 52860 #else 52861 __ai __attribute__((target("neon"))) int8_t vminv_s8(int8x8_t __p0) { 52862 int8_t __ret; 52863 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 52864 __ret = (int8_t) __builtin_neon_vminv_s8(__rev0); 52865 return __ret; 52866 } 52867 #endif 52868 52869 #ifdef __LITTLE_ENDIAN__ 52870 __ai __attribute__((target("neon"))) float32_t vminv_f32(float32x2_t __p0) { 52871 float32_t __ret; 52872 __ret = (float32_t) __builtin_neon_vminv_f32(__p0); 52873 return __ret; 52874 } 52875 #else 52876 __ai __attribute__((target("neon"))) float32_t vminv_f32(float32x2_t __p0) { 52877 float32_t __ret; 52878 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52879 __ret = (float32_t) __builtin_neon_vminv_f32(__rev0); 52880 return __ret; 52881 } 52882 #endif 52883 52884 #ifdef __LITTLE_ENDIAN__ 52885 __ai __attribute__((target("neon"))) int32_t vminv_s32(int32x2_t __p0) { 52886 int32_t __ret; 52887 __ret = (int32_t) __builtin_neon_vminv_s32(__p0); 52888 return __ret; 52889 } 52890 #else 52891 __ai __attribute__((target("neon"))) int32_t vminv_s32(int32x2_t __p0) { 52892 int32_t __ret; 52893 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52894 __ret = (int32_t) __builtin_neon_vminv_s32(__rev0); 52895 return __ret; 52896 } 52897 #endif 52898 52899 #ifdef __LITTLE_ENDIAN__ 52900 __ai __attribute__((target("neon"))) int16_t vminv_s16(int16x4_t __p0) { 52901 
int16_t __ret; 52902 __ret = (int16_t) __builtin_neon_vminv_s16(__p0); 52903 return __ret; 52904 } 52905 #else 52906 __ai __attribute__((target("neon"))) int16_t vminv_s16(int16x4_t __p0) { 52907 int16_t __ret; 52908 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 52909 __ret = (int16_t) __builtin_neon_vminv_s16(__rev0); 52910 return __ret; 52911 } 52912 #endif 52913 52914 #ifdef __LITTLE_ENDIAN__ 52915 __ai __attribute__((target("neon"))) float64x2_t vmlaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 52916 float64x2_t __ret; 52917 __ret = __p0 + __p1 * __p2; 52918 return __ret; 52919 } 52920 #else 52921 __ai __attribute__((target("neon"))) float64x2_t vmlaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 52922 float64x2_t __ret; 52923 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 52924 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 52925 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 52926 __ret = __rev0 + __rev1 * __rev2; 52927 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 52928 return __ret; 52929 } 52930 #endif 52931 52932 __ai __attribute__((target("neon"))) float64x1_t vmla_f64(float64x1_t __p0, float64x1_t __p1, float64x1_t __p2) { 52933 float64x1_t __ret; 52934 __ret = __p0 + __p1 * __p2; 52935 return __ret; 52936 } 52937 #ifdef __LITTLE_ENDIAN__ 52938 #define vmlaq_laneq_u32(__p0_448, __p1_448, __p2_448, __p3_448) __extension__ ({ \ 52939 uint32x4_t __ret_448; \ 52940 uint32x4_t __s0_448 = __p0_448; \ 52941 uint32x4_t __s1_448 = __p1_448; \ 52942 uint32x4_t __s2_448 = __p2_448; \ 52943 __ret_448 = __s0_448 + __s1_448 * splatq_laneq_u32(__s2_448, __p3_448); \ 52944 __ret_448; \ 52945 }) 52946 #else 52947 #define vmlaq_laneq_u32(__p0_449, __p1_449, __p2_449, __p3_449) __extension__ ({ \ 52948 uint32x4_t __ret_449; \ 52949 uint32x4_t __s0_449 = __p0_449; \ 52950 uint32x4_t __s1_449 = __p1_449; \ 52951 uint32x4_t __s2_449 = 
__p2_449; \ 52952 uint32x4_t __rev0_449; __rev0_449 = __builtin_shufflevector(__s0_449, __s0_449, 3, 2, 1, 0); \ 52953 uint32x4_t __rev1_449; __rev1_449 = __builtin_shufflevector(__s1_449, __s1_449, 3, 2, 1, 0); \ 52954 uint32x4_t __rev2_449; __rev2_449 = __builtin_shufflevector(__s2_449, __s2_449, 3, 2, 1, 0); \ 52955 __ret_449 = __rev0_449 + __rev1_449 * __noswap_splatq_laneq_u32(__rev2_449, __p3_449); \ 52956 __ret_449 = __builtin_shufflevector(__ret_449, __ret_449, 3, 2, 1, 0); \ 52957 __ret_449; \ 52958 }) 52959 #endif 52960 52961 #ifdef __LITTLE_ENDIAN__ 52962 #define vmlaq_laneq_u16(__p0_450, __p1_450, __p2_450, __p3_450) __extension__ ({ \ 52963 uint16x8_t __ret_450; \ 52964 uint16x8_t __s0_450 = __p0_450; \ 52965 uint16x8_t __s1_450 = __p1_450; \ 52966 uint16x8_t __s2_450 = __p2_450; \ 52967 __ret_450 = __s0_450 + __s1_450 * splatq_laneq_u16(__s2_450, __p3_450); \ 52968 __ret_450; \ 52969 }) 52970 #else 52971 #define vmlaq_laneq_u16(__p0_451, __p1_451, __p2_451, __p3_451) __extension__ ({ \ 52972 uint16x8_t __ret_451; \ 52973 uint16x8_t __s0_451 = __p0_451; \ 52974 uint16x8_t __s1_451 = __p1_451; \ 52975 uint16x8_t __s2_451 = __p2_451; \ 52976 uint16x8_t __rev0_451; __rev0_451 = __builtin_shufflevector(__s0_451, __s0_451, 7, 6, 5, 4, 3, 2, 1, 0); \ 52977 uint16x8_t __rev1_451; __rev1_451 = __builtin_shufflevector(__s1_451, __s1_451, 7, 6, 5, 4, 3, 2, 1, 0); \ 52978 uint16x8_t __rev2_451; __rev2_451 = __builtin_shufflevector(__s2_451, __s2_451, 7, 6, 5, 4, 3, 2, 1, 0); \ 52979 __ret_451 = __rev0_451 + __rev1_451 * __noswap_splatq_laneq_u16(__rev2_451, __p3_451); \ 52980 __ret_451 = __builtin_shufflevector(__ret_451, __ret_451, 7, 6, 5, 4, 3, 2, 1, 0); \ 52981 __ret_451; \ 52982 }) 52983 #endif 52984 52985 #ifdef __LITTLE_ENDIAN__ 52986 #define vmlaq_laneq_f32(__p0_452, __p1_452, __p2_452, __p3_452) __extension__ ({ \ 52987 float32x4_t __ret_452; \ 52988 float32x4_t __s0_452 = __p0_452; \ 52989 float32x4_t __s1_452 = __p1_452; \ 52990 float32x4_t __s2_452 = 
__p2_452; \ 52991 __ret_452 = __s0_452 + __s1_452 * splatq_laneq_f32(__s2_452, __p3_452); \ 52992 __ret_452; \ 52993 }) 52994 #else 52995 #define vmlaq_laneq_f32(__p0_453, __p1_453, __p2_453, __p3_453) __extension__ ({ \ 52996 float32x4_t __ret_453; \ 52997 float32x4_t __s0_453 = __p0_453; \ 52998 float32x4_t __s1_453 = __p1_453; \ 52999 float32x4_t __s2_453 = __p2_453; \ 53000 float32x4_t __rev0_453; __rev0_453 = __builtin_shufflevector(__s0_453, __s0_453, 3, 2, 1, 0); \ 53001 float32x4_t __rev1_453; __rev1_453 = __builtin_shufflevector(__s1_453, __s1_453, 3, 2, 1, 0); \ 53002 float32x4_t __rev2_453; __rev2_453 = __builtin_shufflevector(__s2_453, __s2_453, 3, 2, 1, 0); \ 53003 __ret_453 = __rev0_453 + __rev1_453 * __noswap_splatq_laneq_f32(__rev2_453, __p3_453); \ 53004 __ret_453 = __builtin_shufflevector(__ret_453, __ret_453, 3, 2, 1, 0); \ 53005 __ret_453; \ 53006 }) 53007 #endif 53008 53009 #ifdef __LITTLE_ENDIAN__ 53010 #define vmlaq_laneq_s32(__p0_454, __p1_454, __p2_454, __p3_454) __extension__ ({ \ 53011 int32x4_t __ret_454; \ 53012 int32x4_t __s0_454 = __p0_454; \ 53013 int32x4_t __s1_454 = __p1_454; \ 53014 int32x4_t __s2_454 = __p2_454; \ 53015 __ret_454 = __s0_454 + __s1_454 * splatq_laneq_s32(__s2_454, __p3_454); \ 53016 __ret_454; \ 53017 }) 53018 #else 53019 #define vmlaq_laneq_s32(__p0_455, __p1_455, __p2_455, __p3_455) __extension__ ({ \ 53020 int32x4_t __ret_455; \ 53021 int32x4_t __s0_455 = __p0_455; \ 53022 int32x4_t __s1_455 = __p1_455; \ 53023 int32x4_t __s2_455 = __p2_455; \ 53024 int32x4_t __rev0_455; __rev0_455 = __builtin_shufflevector(__s0_455, __s0_455, 3, 2, 1, 0); \ 53025 int32x4_t __rev1_455; __rev1_455 = __builtin_shufflevector(__s1_455, __s1_455, 3, 2, 1, 0); \ 53026 int32x4_t __rev2_455; __rev2_455 = __builtin_shufflevector(__s2_455, __s2_455, 3, 2, 1, 0); \ 53027 __ret_455 = __rev0_455 + __rev1_455 * __noswap_splatq_laneq_s32(__rev2_455, __p3_455); \ 53028 __ret_455 = __builtin_shufflevector(__ret_455, __ret_455, 3, 2, 1, 0); \ 
53029 __ret_455; \ 53030 }) 53031 #endif 53032 53033 #ifdef __LITTLE_ENDIAN__ 53034 #define vmlaq_laneq_s16(__p0_456, __p1_456, __p2_456, __p3_456) __extension__ ({ \ 53035 int16x8_t __ret_456; \ 53036 int16x8_t __s0_456 = __p0_456; \ 53037 int16x8_t __s1_456 = __p1_456; \ 53038 int16x8_t __s2_456 = __p2_456; \ 53039 __ret_456 = __s0_456 + __s1_456 * splatq_laneq_s16(__s2_456, __p3_456); \ 53040 __ret_456; \ 53041 }) 53042 #else 53043 #define vmlaq_laneq_s16(__p0_457, __p1_457, __p2_457, __p3_457) __extension__ ({ \ 53044 int16x8_t __ret_457; \ 53045 int16x8_t __s0_457 = __p0_457; \ 53046 int16x8_t __s1_457 = __p1_457; \ 53047 int16x8_t __s2_457 = __p2_457; \ 53048 int16x8_t __rev0_457; __rev0_457 = __builtin_shufflevector(__s0_457, __s0_457, 7, 6, 5, 4, 3, 2, 1, 0); \ 53049 int16x8_t __rev1_457; __rev1_457 = __builtin_shufflevector(__s1_457, __s1_457, 7, 6, 5, 4, 3, 2, 1, 0); \ 53050 int16x8_t __rev2_457; __rev2_457 = __builtin_shufflevector(__s2_457, __s2_457, 7, 6, 5, 4, 3, 2, 1, 0); \ 53051 __ret_457 = __rev0_457 + __rev1_457 * __noswap_splatq_laneq_s16(__rev2_457, __p3_457); \ 53052 __ret_457 = __builtin_shufflevector(__ret_457, __ret_457, 7, 6, 5, 4, 3, 2, 1, 0); \ 53053 __ret_457; \ 53054 }) 53055 #endif 53056 53057 #ifdef __LITTLE_ENDIAN__ 53058 #define vmla_laneq_u32(__p0_458, __p1_458, __p2_458, __p3_458) __extension__ ({ \ 53059 uint32x2_t __ret_458; \ 53060 uint32x2_t __s0_458 = __p0_458; \ 53061 uint32x2_t __s1_458 = __p1_458; \ 53062 uint32x4_t __s2_458 = __p2_458; \ 53063 __ret_458 = __s0_458 + __s1_458 * splat_laneq_u32(__s2_458, __p3_458); \ 53064 __ret_458; \ 53065 }) 53066 #else 53067 #define vmla_laneq_u32(__p0_459, __p1_459, __p2_459, __p3_459) __extension__ ({ \ 53068 uint32x2_t __ret_459; \ 53069 uint32x2_t __s0_459 = __p0_459; \ 53070 uint32x2_t __s1_459 = __p1_459; \ 53071 uint32x4_t __s2_459 = __p2_459; \ 53072 uint32x2_t __rev0_459; __rev0_459 = __builtin_shufflevector(__s0_459, __s0_459, 1, 0); \ 53073 uint32x2_t __rev1_459; __rev1_459 = 
__builtin_shufflevector(__s1_459, __s1_459, 1, 0); \ 53074 uint32x4_t __rev2_459; __rev2_459 = __builtin_shufflevector(__s2_459, __s2_459, 3, 2, 1, 0); \ 53075 __ret_459 = __rev0_459 + __rev1_459 * __noswap_splat_laneq_u32(__rev2_459, __p3_459); \ 53076 __ret_459 = __builtin_shufflevector(__ret_459, __ret_459, 1, 0); \ 53077 __ret_459; \ 53078 }) 53079 #endif 53080 53081 #ifdef __LITTLE_ENDIAN__ 53082 #define vmla_laneq_u16(__p0_460, __p1_460, __p2_460, __p3_460) __extension__ ({ \ 53083 uint16x4_t __ret_460; \ 53084 uint16x4_t __s0_460 = __p0_460; \ 53085 uint16x4_t __s1_460 = __p1_460; \ 53086 uint16x8_t __s2_460 = __p2_460; \ 53087 __ret_460 = __s0_460 + __s1_460 * splat_laneq_u16(__s2_460, __p3_460); \ 53088 __ret_460; \ 53089 }) 53090 #else 53091 #define vmla_laneq_u16(__p0_461, __p1_461, __p2_461, __p3_461) __extension__ ({ \ 53092 uint16x4_t __ret_461; \ 53093 uint16x4_t __s0_461 = __p0_461; \ 53094 uint16x4_t __s1_461 = __p1_461; \ 53095 uint16x8_t __s2_461 = __p2_461; \ 53096 uint16x4_t __rev0_461; __rev0_461 = __builtin_shufflevector(__s0_461, __s0_461, 3, 2, 1, 0); \ 53097 uint16x4_t __rev1_461; __rev1_461 = __builtin_shufflevector(__s1_461, __s1_461, 3, 2, 1, 0); \ 53098 uint16x8_t __rev2_461; __rev2_461 = __builtin_shufflevector(__s2_461, __s2_461, 7, 6, 5, 4, 3, 2, 1, 0); \ 53099 __ret_461 = __rev0_461 + __rev1_461 * __noswap_splat_laneq_u16(__rev2_461, __p3_461); \ 53100 __ret_461 = __builtin_shufflevector(__ret_461, __ret_461, 3, 2, 1, 0); \ 53101 __ret_461; \ 53102 }) 53103 #endif 53104 53105 #ifdef __LITTLE_ENDIAN__ 53106 #define vmla_laneq_f32(__p0_462, __p1_462, __p2_462, __p3_462) __extension__ ({ \ 53107 float32x2_t __ret_462; \ 53108 float32x2_t __s0_462 = __p0_462; \ 53109 float32x2_t __s1_462 = __p1_462; \ 53110 float32x4_t __s2_462 = __p2_462; \ 53111 __ret_462 = __s0_462 + __s1_462 * splat_laneq_f32(__s2_462, __p3_462); \ 53112 __ret_462; \ 53113 }) 53114 #else 53115 #define vmla_laneq_f32(__p0_463, __p1_463, __p2_463, __p3_463) 
__extension__ ({ \ 53116 float32x2_t __ret_463; \ 53117 float32x2_t __s0_463 = __p0_463; \ 53118 float32x2_t __s1_463 = __p1_463; \ 53119 float32x4_t __s2_463 = __p2_463; \ 53120 float32x2_t __rev0_463; __rev0_463 = __builtin_shufflevector(__s0_463, __s0_463, 1, 0); \ 53121 float32x2_t __rev1_463; __rev1_463 = __builtin_shufflevector(__s1_463, __s1_463, 1, 0); \ 53122 float32x4_t __rev2_463; __rev2_463 = __builtin_shufflevector(__s2_463, __s2_463, 3, 2, 1, 0); \ 53123 __ret_463 = __rev0_463 + __rev1_463 * __noswap_splat_laneq_f32(__rev2_463, __p3_463); \ 53124 __ret_463 = __builtin_shufflevector(__ret_463, __ret_463, 1, 0); \ 53125 __ret_463; \ 53126 }) 53127 #endif 53128 53129 #ifdef __LITTLE_ENDIAN__ 53130 #define vmla_laneq_s32(__p0_464, __p1_464, __p2_464, __p3_464) __extension__ ({ \ 53131 int32x2_t __ret_464; \ 53132 int32x2_t __s0_464 = __p0_464; \ 53133 int32x2_t __s1_464 = __p1_464; \ 53134 int32x4_t __s2_464 = __p2_464; \ 53135 __ret_464 = __s0_464 + __s1_464 * splat_laneq_s32(__s2_464, __p3_464); \ 53136 __ret_464; \ 53137 }) 53138 #else 53139 #define vmla_laneq_s32(__p0_465, __p1_465, __p2_465, __p3_465) __extension__ ({ \ 53140 int32x2_t __ret_465; \ 53141 int32x2_t __s0_465 = __p0_465; \ 53142 int32x2_t __s1_465 = __p1_465; \ 53143 int32x4_t __s2_465 = __p2_465; \ 53144 int32x2_t __rev0_465; __rev0_465 = __builtin_shufflevector(__s0_465, __s0_465, 1, 0); \ 53145 int32x2_t __rev1_465; __rev1_465 = __builtin_shufflevector(__s1_465, __s1_465, 1, 0); \ 53146 int32x4_t __rev2_465; __rev2_465 = __builtin_shufflevector(__s2_465, __s2_465, 3, 2, 1, 0); \ 53147 __ret_465 = __rev0_465 + __rev1_465 * __noswap_splat_laneq_s32(__rev2_465, __p3_465); \ 53148 __ret_465 = __builtin_shufflevector(__ret_465, __ret_465, 1, 0); \ 53149 __ret_465; \ 53150 }) 53151 #endif 53152 53153 #ifdef __LITTLE_ENDIAN__ 53154 #define vmla_laneq_s16(__p0_466, __p1_466, __p2_466, __p3_466) __extension__ ({ \ 53155 int16x4_t __ret_466; \ 53156 int16x4_t __s0_466 = __p0_466; \ 53157 
int16x4_t __s1_466 = __p1_466; \ 53158 int16x8_t __s2_466 = __p2_466; \ 53159 __ret_466 = __s0_466 + __s1_466 * splat_laneq_s16(__s2_466, __p3_466); \ 53160 __ret_466; \ 53161 }) 53162 #else 53163 #define vmla_laneq_s16(__p0_467, __p1_467, __p2_467, __p3_467) __extension__ ({ \ 53164 int16x4_t __ret_467; \ 53165 int16x4_t __s0_467 = __p0_467; \ 53166 int16x4_t __s1_467 = __p1_467; \ 53167 int16x8_t __s2_467 = __p2_467; \ 53168 int16x4_t __rev0_467; __rev0_467 = __builtin_shufflevector(__s0_467, __s0_467, 3, 2, 1, 0); \ 53169 int16x4_t __rev1_467; __rev1_467 = __builtin_shufflevector(__s1_467, __s1_467, 3, 2, 1, 0); \ 53170 int16x8_t __rev2_467; __rev2_467 = __builtin_shufflevector(__s2_467, __s2_467, 7, 6, 5, 4, 3, 2, 1, 0); \ 53171 __ret_467 = __rev0_467 + __rev1_467 * __noswap_splat_laneq_s16(__rev2_467, __p3_467); \ 53172 __ret_467 = __builtin_shufflevector(__ret_467, __ret_467, 3, 2, 1, 0); \ 53173 __ret_467; \ 53174 }) 53175 #endif 53176 53177 #ifdef __LITTLE_ENDIAN__ 53178 #define vmlal_high_lane_u32(__p0_468, __p1_468, __p2_468, __p3_468) __extension__ ({ \ 53179 uint64x2_t __ret_468; \ 53180 uint64x2_t __s0_468 = __p0_468; \ 53181 uint32x4_t __s1_468 = __p1_468; \ 53182 uint32x2_t __s2_468 = __p2_468; \ 53183 __ret_468 = __s0_468 + vmull_u32(vget_high_u32(__s1_468), splat_lane_u32(__s2_468, __p3_468)); \ 53184 __ret_468; \ 53185 }) 53186 #else 53187 #define vmlal_high_lane_u32(__p0_469, __p1_469, __p2_469, __p3_469) __extension__ ({ \ 53188 uint64x2_t __ret_469; \ 53189 uint64x2_t __s0_469 = __p0_469; \ 53190 uint32x4_t __s1_469 = __p1_469; \ 53191 uint32x2_t __s2_469 = __p2_469; \ 53192 uint64x2_t __rev0_469; __rev0_469 = __builtin_shufflevector(__s0_469, __s0_469, 1, 0); \ 53193 uint32x4_t __rev1_469; __rev1_469 = __builtin_shufflevector(__s1_469, __s1_469, 3, 2, 1, 0); \ 53194 uint32x2_t __rev2_469; __rev2_469 = __builtin_shufflevector(__s2_469, __s2_469, 1, 0); \ 53195 __ret_469 = __rev0_469 + __noswap_vmull_u32(__noswap_vget_high_u32(__rev1_469), 
__noswap_splat_lane_u32(__rev2_469, __p3_469)); \ 53196 __ret_469 = __builtin_shufflevector(__ret_469, __ret_469, 1, 0); \ 53197 __ret_469; \ 53198 }) 53199 #endif 53200 53201 #ifdef __LITTLE_ENDIAN__ 53202 #define vmlal_high_lane_u16(__p0_470, __p1_470, __p2_470, __p3_470) __extension__ ({ \ 53203 uint32x4_t __ret_470; \ 53204 uint32x4_t __s0_470 = __p0_470; \ 53205 uint16x8_t __s1_470 = __p1_470; \ 53206 uint16x4_t __s2_470 = __p2_470; \ 53207 __ret_470 = __s0_470 + vmull_u16(vget_high_u16(__s1_470), splat_lane_u16(__s2_470, __p3_470)); \ 53208 __ret_470; \ 53209 }) 53210 #else 53211 #define vmlal_high_lane_u16(__p0_471, __p1_471, __p2_471, __p3_471) __extension__ ({ \ 53212 uint32x4_t __ret_471; \ 53213 uint32x4_t __s0_471 = __p0_471; \ 53214 uint16x8_t __s1_471 = __p1_471; \ 53215 uint16x4_t __s2_471 = __p2_471; \ 53216 uint32x4_t __rev0_471; __rev0_471 = __builtin_shufflevector(__s0_471, __s0_471, 3, 2, 1, 0); \ 53217 uint16x8_t __rev1_471; __rev1_471 = __builtin_shufflevector(__s1_471, __s1_471, 7, 6, 5, 4, 3, 2, 1, 0); \ 53218 uint16x4_t __rev2_471; __rev2_471 = __builtin_shufflevector(__s2_471, __s2_471, 3, 2, 1, 0); \ 53219 __ret_471 = __rev0_471 + __noswap_vmull_u16(__noswap_vget_high_u16(__rev1_471), __noswap_splat_lane_u16(__rev2_471, __p3_471)); \ 53220 __ret_471 = __builtin_shufflevector(__ret_471, __ret_471, 3, 2, 1, 0); \ 53221 __ret_471; \ 53222 }) 53223 #endif 53224 53225 #ifdef __LITTLE_ENDIAN__ 53226 #define vmlal_high_lane_s32(__p0_472, __p1_472, __p2_472, __p3_472) __extension__ ({ \ 53227 int64x2_t __ret_472; \ 53228 int64x2_t __s0_472 = __p0_472; \ 53229 int32x4_t __s1_472 = __p1_472; \ 53230 int32x2_t __s2_472 = __p2_472; \ 53231 __ret_472 = __s0_472 + vmull_s32(vget_high_s32(__s1_472), splat_lane_s32(__s2_472, __p3_472)); \ 53232 __ret_472; \ 53233 }) 53234 #else 53235 #define vmlal_high_lane_s32(__p0_473, __p1_473, __p2_473, __p3_473) __extension__ ({ \ 53236 int64x2_t __ret_473; \ 53237 int64x2_t __s0_473 = __p0_473; \ 53238 int32x4_t 
__s1_473 = __p1_473; \ 53239 int32x2_t __s2_473 = __p2_473; \ 53240 int64x2_t __rev0_473; __rev0_473 = __builtin_shufflevector(__s0_473, __s0_473, 1, 0); \ 53241 int32x4_t __rev1_473; __rev1_473 = __builtin_shufflevector(__s1_473, __s1_473, 3, 2, 1, 0); \ 53242 int32x2_t __rev2_473; __rev2_473 = __builtin_shufflevector(__s2_473, __s2_473, 1, 0); \ 53243 __ret_473 = __rev0_473 + __noswap_vmull_s32(__noswap_vget_high_s32(__rev1_473), __noswap_splat_lane_s32(__rev2_473, __p3_473)); \ 53244 __ret_473 = __builtin_shufflevector(__ret_473, __ret_473, 1, 0); \ 53245 __ret_473; \ 53246 }) 53247 #endif 53248 53249 #ifdef __LITTLE_ENDIAN__ 53250 #define vmlal_high_lane_s16(__p0_474, __p1_474, __p2_474, __p3_474) __extension__ ({ \ 53251 int32x4_t __ret_474; \ 53252 int32x4_t __s0_474 = __p0_474; \ 53253 int16x8_t __s1_474 = __p1_474; \ 53254 int16x4_t __s2_474 = __p2_474; \ 53255 __ret_474 = __s0_474 + vmull_s16(vget_high_s16(__s1_474), splat_lane_s16(__s2_474, __p3_474)); \ 53256 __ret_474; \ 53257 }) 53258 #else 53259 #define vmlal_high_lane_s16(__p0_475, __p1_475, __p2_475, __p3_475) __extension__ ({ \ 53260 int32x4_t __ret_475; \ 53261 int32x4_t __s0_475 = __p0_475; \ 53262 int16x8_t __s1_475 = __p1_475; \ 53263 int16x4_t __s2_475 = __p2_475; \ 53264 int32x4_t __rev0_475; __rev0_475 = __builtin_shufflevector(__s0_475, __s0_475, 3, 2, 1, 0); \ 53265 int16x8_t __rev1_475; __rev1_475 = __builtin_shufflevector(__s1_475, __s1_475, 7, 6, 5, 4, 3, 2, 1, 0); \ 53266 int16x4_t __rev2_475; __rev2_475 = __builtin_shufflevector(__s2_475, __s2_475, 3, 2, 1, 0); \ 53267 __ret_475 = __rev0_475 + __noswap_vmull_s16(__noswap_vget_high_s16(__rev1_475), __noswap_splat_lane_s16(__rev2_475, __p3_475)); \ 53268 __ret_475 = __builtin_shufflevector(__ret_475, __ret_475, 3, 2, 1, 0); \ 53269 __ret_475; \ 53270 }) 53271 #endif 53272 53273 #ifdef __LITTLE_ENDIAN__ 53274 #define vmlal_high_laneq_u32(__p0_476, __p1_476, __p2_476, __p3_476) __extension__ ({ \ 53275 uint64x2_t __ret_476; \ 53276 
uint64x2_t __s0_476 = __p0_476; \ 53277 uint32x4_t __s1_476 = __p1_476; \ 53278 uint32x4_t __s2_476 = __p2_476; \ 53279 __ret_476 = __s0_476 + vmull_u32(vget_high_u32(__s1_476), splat_laneq_u32(__s2_476, __p3_476)); \ 53280 __ret_476; \ 53281 }) 53282 #else 53283 #define vmlal_high_laneq_u32(__p0_477, __p1_477, __p2_477, __p3_477) __extension__ ({ \ 53284 uint64x2_t __ret_477; \ 53285 uint64x2_t __s0_477 = __p0_477; \ 53286 uint32x4_t __s1_477 = __p1_477; \ 53287 uint32x4_t __s2_477 = __p2_477; \ 53288 uint64x2_t __rev0_477; __rev0_477 = __builtin_shufflevector(__s0_477, __s0_477, 1, 0); \ 53289 uint32x4_t __rev1_477; __rev1_477 = __builtin_shufflevector(__s1_477, __s1_477, 3, 2, 1, 0); \ 53290 uint32x4_t __rev2_477; __rev2_477 = __builtin_shufflevector(__s2_477, __s2_477, 3, 2, 1, 0); \ 53291 __ret_477 = __rev0_477 + __noswap_vmull_u32(__noswap_vget_high_u32(__rev1_477), __noswap_splat_laneq_u32(__rev2_477, __p3_477)); \ 53292 __ret_477 = __builtin_shufflevector(__ret_477, __ret_477, 1, 0); \ 53293 __ret_477; \ 53294 }) 53295 #endif 53296 53297 #ifdef __LITTLE_ENDIAN__ 53298 #define vmlal_high_laneq_u16(__p0_478, __p1_478, __p2_478, __p3_478) __extension__ ({ \ 53299 uint32x4_t __ret_478; \ 53300 uint32x4_t __s0_478 = __p0_478; \ 53301 uint16x8_t __s1_478 = __p1_478; \ 53302 uint16x8_t __s2_478 = __p2_478; \ 53303 __ret_478 = __s0_478 + vmull_u16(vget_high_u16(__s1_478), splat_laneq_u16(__s2_478, __p3_478)); \ 53304 __ret_478; \ 53305 }) 53306 #else 53307 #define vmlal_high_laneq_u16(__p0_479, __p1_479, __p2_479, __p3_479) __extension__ ({ \ 53308 uint32x4_t __ret_479; \ 53309 uint32x4_t __s0_479 = __p0_479; \ 53310 uint16x8_t __s1_479 = __p1_479; \ 53311 uint16x8_t __s2_479 = __p2_479; \ 53312 uint32x4_t __rev0_479; __rev0_479 = __builtin_shufflevector(__s0_479, __s0_479, 3, 2, 1, 0); \ 53313 uint16x8_t __rev1_479; __rev1_479 = __builtin_shufflevector(__s1_479, __s1_479, 7, 6, 5, 4, 3, 2, 1, 0); \ 53314 uint16x8_t __rev2_479; __rev2_479 = 
__builtin_shufflevector(__s2_479, __s2_479, 7, 6, 5, 4, 3, 2, 1, 0); \ 53315 __ret_479 = __rev0_479 + __noswap_vmull_u16(__noswap_vget_high_u16(__rev1_479), __noswap_splat_laneq_u16(__rev2_479, __p3_479)); \ 53316 __ret_479 = __builtin_shufflevector(__ret_479, __ret_479, 3, 2, 1, 0); \ 53317 __ret_479; \ 53318 }) 53319 #endif 53320 53321 #ifdef __LITTLE_ENDIAN__ 53322 #define vmlal_high_laneq_s32(__p0_480, __p1_480, __p2_480, __p3_480) __extension__ ({ \ 53323 int64x2_t __ret_480; \ 53324 int64x2_t __s0_480 = __p0_480; \ 53325 int32x4_t __s1_480 = __p1_480; \ 53326 int32x4_t __s2_480 = __p2_480; \ 53327 __ret_480 = __s0_480 + vmull_s32(vget_high_s32(__s1_480), splat_laneq_s32(__s2_480, __p3_480)); \ 53328 __ret_480; \ 53329 }) 53330 #else 53331 #define vmlal_high_laneq_s32(__p0_481, __p1_481, __p2_481, __p3_481) __extension__ ({ \ 53332 int64x2_t __ret_481; \ 53333 int64x2_t __s0_481 = __p0_481; \ 53334 int32x4_t __s1_481 = __p1_481; \ 53335 int32x4_t __s2_481 = __p2_481; \ 53336 int64x2_t __rev0_481; __rev0_481 = __builtin_shufflevector(__s0_481, __s0_481, 1, 0); \ 53337 int32x4_t __rev1_481; __rev1_481 = __builtin_shufflevector(__s1_481, __s1_481, 3, 2, 1, 0); \ 53338 int32x4_t __rev2_481; __rev2_481 = __builtin_shufflevector(__s2_481, __s2_481, 3, 2, 1, 0); \ 53339 __ret_481 = __rev0_481 + __noswap_vmull_s32(__noswap_vget_high_s32(__rev1_481), __noswap_splat_laneq_s32(__rev2_481, __p3_481)); \ 53340 __ret_481 = __builtin_shufflevector(__ret_481, __ret_481, 1, 0); \ 53341 __ret_481; \ 53342 }) 53343 #endif 53344 53345 #ifdef __LITTLE_ENDIAN__ 53346 #define vmlal_high_laneq_s16(__p0_482, __p1_482, __p2_482, __p3_482) __extension__ ({ \ 53347 int32x4_t __ret_482; \ 53348 int32x4_t __s0_482 = __p0_482; \ 53349 int16x8_t __s1_482 = __p1_482; \ 53350 int16x8_t __s2_482 = __p2_482; \ 53351 __ret_482 = __s0_482 + vmull_s16(vget_high_s16(__s1_482), splat_laneq_s16(__s2_482, __p3_482)); \ 53352 __ret_482; \ 53353 }) 53354 #else 53355 #define vmlal_high_laneq_s16(__p0_483, 
__p1_483, __p2_483, __p3_483) __extension__ ({ \ 53356 int32x4_t __ret_483; \ 53357 int32x4_t __s0_483 = __p0_483; \ 53358 int16x8_t __s1_483 = __p1_483; \ 53359 int16x8_t __s2_483 = __p2_483; \ 53360 int32x4_t __rev0_483; __rev0_483 = __builtin_shufflevector(__s0_483, __s0_483, 3, 2, 1, 0); \ 53361 int16x8_t __rev1_483; __rev1_483 = __builtin_shufflevector(__s1_483, __s1_483, 7, 6, 5, 4, 3, 2, 1, 0); \ 53362 int16x8_t __rev2_483; __rev2_483 = __builtin_shufflevector(__s2_483, __s2_483, 7, 6, 5, 4, 3, 2, 1, 0); \ 53363 __ret_483 = __rev0_483 + __noswap_vmull_s16(__noswap_vget_high_s16(__rev1_483), __noswap_splat_laneq_s16(__rev2_483, __p3_483)); \ 53364 __ret_483 = __builtin_shufflevector(__ret_483, __ret_483, 3, 2, 1, 0); \ 53365 __ret_483; \ 53366 }) 53367 #endif 53368 53369 #ifdef __LITTLE_ENDIAN__ 53370 #define vmlal_laneq_u32(__p0_484, __p1_484, __p2_484, __p3_484) __extension__ ({ \ 53371 uint64x2_t __ret_484; \ 53372 uint64x2_t __s0_484 = __p0_484; \ 53373 uint32x2_t __s1_484 = __p1_484; \ 53374 uint32x4_t __s2_484 = __p2_484; \ 53375 __ret_484 = __s0_484 + vmull_u32(__s1_484, splat_laneq_u32(__s2_484, __p3_484)); \ 53376 __ret_484; \ 53377 }) 53378 #else 53379 #define vmlal_laneq_u32(__p0_485, __p1_485, __p2_485, __p3_485) __extension__ ({ \ 53380 uint64x2_t __ret_485; \ 53381 uint64x2_t __s0_485 = __p0_485; \ 53382 uint32x2_t __s1_485 = __p1_485; \ 53383 uint32x4_t __s2_485 = __p2_485; \ 53384 uint64x2_t __rev0_485; __rev0_485 = __builtin_shufflevector(__s0_485, __s0_485, 1, 0); \ 53385 uint32x2_t __rev1_485; __rev1_485 = __builtin_shufflevector(__s1_485, __s1_485, 1, 0); \ 53386 uint32x4_t __rev2_485; __rev2_485 = __builtin_shufflevector(__s2_485, __s2_485, 3, 2, 1, 0); \ 53387 __ret_485 = __rev0_485 + __noswap_vmull_u32(__rev1_485, __noswap_splat_laneq_u32(__rev2_485, __p3_485)); \ 53388 __ret_485 = __builtin_shufflevector(__ret_485, __ret_485, 1, 0); \ 53389 __ret_485; \ 53390 }) 53391 #endif 53392 53393 #ifdef __LITTLE_ENDIAN__ 53394 #define 
vmlal_laneq_u16(__p0_486, __p1_486, __p2_486, __p3_486) __extension__ ({ \ 53395 uint32x4_t __ret_486; \ 53396 uint32x4_t __s0_486 = __p0_486; \ 53397 uint16x4_t __s1_486 = __p1_486; \ 53398 uint16x8_t __s2_486 = __p2_486; \ 53399 __ret_486 = __s0_486 + vmull_u16(__s1_486, splat_laneq_u16(__s2_486, __p3_486)); \ 53400 __ret_486; \ 53401 }) 53402 #else 53403 #define vmlal_laneq_u16(__p0_487, __p1_487, __p2_487, __p3_487) __extension__ ({ \ 53404 uint32x4_t __ret_487; \ 53405 uint32x4_t __s0_487 = __p0_487; \ 53406 uint16x4_t __s1_487 = __p1_487; \ 53407 uint16x8_t __s2_487 = __p2_487; \ 53408 uint32x4_t __rev0_487; __rev0_487 = __builtin_shufflevector(__s0_487, __s0_487, 3, 2, 1, 0); \ 53409 uint16x4_t __rev1_487; __rev1_487 = __builtin_shufflevector(__s1_487, __s1_487, 3, 2, 1, 0); \ 53410 uint16x8_t __rev2_487; __rev2_487 = __builtin_shufflevector(__s2_487, __s2_487, 7, 6, 5, 4, 3, 2, 1, 0); \ 53411 __ret_487 = __rev0_487 + __noswap_vmull_u16(__rev1_487, __noswap_splat_laneq_u16(__rev2_487, __p3_487)); \ 53412 __ret_487 = __builtin_shufflevector(__ret_487, __ret_487, 3, 2, 1, 0); \ 53413 __ret_487; \ 53414 }) 53415 #endif 53416 53417 #ifdef __LITTLE_ENDIAN__ 53418 #define vmlal_laneq_s32(__p0_488, __p1_488, __p2_488, __p3_488) __extension__ ({ \ 53419 int64x2_t __ret_488; \ 53420 int64x2_t __s0_488 = __p0_488; \ 53421 int32x2_t __s1_488 = __p1_488; \ 53422 int32x4_t __s2_488 = __p2_488; \ 53423 __ret_488 = __s0_488 + vmull_s32(__s1_488, splat_laneq_s32(__s2_488, __p3_488)); \ 53424 __ret_488; \ 53425 }) 53426 #else 53427 #define vmlal_laneq_s32(__p0_489, __p1_489, __p2_489, __p3_489) __extension__ ({ \ 53428 int64x2_t __ret_489; \ 53429 int64x2_t __s0_489 = __p0_489; \ 53430 int32x2_t __s1_489 = __p1_489; \ 53431 int32x4_t __s2_489 = __p2_489; \ 53432 int64x2_t __rev0_489; __rev0_489 = __builtin_shufflevector(__s0_489, __s0_489, 1, 0); \ 53433 int32x2_t __rev1_489; __rev1_489 = __builtin_shufflevector(__s1_489, __s1_489, 1, 0); \ 53434 int32x4_t __rev2_489; 
__rev2_489 = __builtin_shufflevector(__s2_489, __s2_489, 3, 2, 1, 0); \ 53435 __ret_489 = __rev0_489 + __noswap_vmull_s32(__rev1_489, __noswap_splat_laneq_s32(__rev2_489, __p3_489)); \ 53436 __ret_489 = __builtin_shufflevector(__ret_489, __ret_489, 1, 0); \ 53437 __ret_489; \ 53438 }) 53439 #endif 53440 53441 #ifdef __LITTLE_ENDIAN__ 53442 #define vmlal_laneq_s16(__p0_490, __p1_490, __p2_490, __p3_490) __extension__ ({ \ 53443 int32x4_t __ret_490; \ 53444 int32x4_t __s0_490 = __p0_490; \ 53445 int16x4_t __s1_490 = __p1_490; \ 53446 int16x8_t __s2_490 = __p2_490; \ 53447 __ret_490 = __s0_490 + vmull_s16(__s1_490, splat_laneq_s16(__s2_490, __p3_490)); \ 53448 __ret_490; \ 53449 }) 53450 #else 53451 #define vmlal_laneq_s16(__p0_491, __p1_491, __p2_491, __p3_491) __extension__ ({ \ 53452 int32x4_t __ret_491; \ 53453 int32x4_t __s0_491 = __p0_491; \ 53454 int16x4_t __s1_491 = __p1_491; \ 53455 int16x8_t __s2_491 = __p2_491; \ 53456 int32x4_t __rev0_491; __rev0_491 = __builtin_shufflevector(__s0_491, __s0_491, 3, 2, 1, 0); \ 53457 int16x4_t __rev1_491; __rev1_491 = __builtin_shufflevector(__s1_491, __s1_491, 3, 2, 1, 0); \ 53458 int16x8_t __rev2_491; __rev2_491 = __builtin_shufflevector(__s2_491, __s2_491, 7, 6, 5, 4, 3, 2, 1, 0); \ 53459 __ret_491 = __rev0_491 + __noswap_vmull_s16(__rev1_491, __noswap_splat_laneq_s16(__rev2_491, __p3_491)); \ 53460 __ret_491 = __builtin_shufflevector(__ret_491, __ret_491, 3, 2, 1, 0); \ 53461 __ret_491; \ 53462 }) 53463 #endif 53464 53465 #ifdef __LITTLE_ENDIAN__ 53466 __ai __attribute__((target("neon"))) float64x2_t vmlsq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 53467 float64x2_t __ret; 53468 __ret = __p0 - __p1 * __p2; 53469 return __ret; 53470 } 53471 #else 53472 __ai __attribute__((target("neon"))) float64x2_t vmlsq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 53473 float64x2_t __ret; 53474 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 53475 float64x2_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 1, 0); 53476 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 53477 __ret = __rev0 - __rev1 * __rev2; 53478 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 53479 return __ret; 53480 } 53481 #endif 53482 53483 __ai __attribute__((target("neon"))) float64x1_t vmls_f64(float64x1_t __p0, float64x1_t __p1, float64x1_t __p2) { 53484 float64x1_t __ret; 53485 __ret = __p0 - __p1 * __p2; 53486 return __ret; 53487 } 53488 #ifdef __LITTLE_ENDIAN__ 53489 #define vmlsq_laneq_u32(__p0_492, __p1_492, __p2_492, __p3_492) __extension__ ({ \ 53490 uint32x4_t __ret_492; \ 53491 uint32x4_t __s0_492 = __p0_492; \ 53492 uint32x4_t __s1_492 = __p1_492; \ 53493 uint32x4_t __s2_492 = __p2_492; \ 53494 __ret_492 = __s0_492 - __s1_492 * splatq_laneq_u32(__s2_492, __p3_492); \ 53495 __ret_492; \ 53496 }) 53497 #else 53498 #define vmlsq_laneq_u32(__p0_493, __p1_493, __p2_493, __p3_493) __extension__ ({ \ 53499 uint32x4_t __ret_493; \ 53500 uint32x4_t __s0_493 = __p0_493; \ 53501 uint32x4_t __s1_493 = __p1_493; \ 53502 uint32x4_t __s2_493 = __p2_493; \ 53503 uint32x4_t __rev0_493; __rev0_493 = __builtin_shufflevector(__s0_493, __s0_493, 3, 2, 1, 0); \ 53504 uint32x4_t __rev1_493; __rev1_493 = __builtin_shufflevector(__s1_493, __s1_493, 3, 2, 1, 0); \ 53505 uint32x4_t __rev2_493; __rev2_493 = __builtin_shufflevector(__s2_493, __s2_493, 3, 2, 1, 0); \ 53506 __ret_493 = __rev0_493 - __rev1_493 * __noswap_splatq_laneq_u32(__rev2_493, __p3_493); \ 53507 __ret_493 = __builtin_shufflevector(__ret_493, __ret_493, 3, 2, 1, 0); \ 53508 __ret_493; \ 53509 }) 53510 #endif 53511 53512 #ifdef __LITTLE_ENDIAN__ 53513 #define vmlsq_laneq_u16(__p0_494, __p1_494, __p2_494, __p3_494) __extension__ ({ \ 53514 uint16x8_t __ret_494; \ 53515 uint16x8_t __s0_494 = __p0_494; \ 53516 uint16x8_t __s1_494 = __p1_494; \ 53517 uint16x8_t __s2_494 = __p2_494; \ 53518 __ret_494 = __s0_494 - __s1_494 * splatq_laneq_u16(__s2_494, __p3_494); \ 53519 __ret_494; \ 
53520 }) 53521 #else 53522 #define vmlsq_laneq_u16(__p0_495, __p1_495, __p2_495, __p3_495) __extension__ ({ \ 53523 uint16x8_t __ret_495; \ 53524 uint16x8_t __s0_495 = __p0_495; \ 53525 uint16x8_t __s1_495 = __p1_495; \ 53526 uint16x8_t __s2_495 = __p2_495; \ 53527 uint16x8_t __rev0_495; __rev0_495 = __builtin_shufflevector(__s0_495, __s0_495, 7, 6, 5, 4, 3, 2, 1, 0); \ 53528 uint16x8_t __rev1_495; __rev1_495 = __builtin_shufflevector(__s1_495, __s1_495, 7, 6, 5, 4, 3, 2, 1, 0); \ 53529 uint16x8_t __rev2_495; __rev2_495 = __builtin_shufflevector(__s2_495, __s2_495, 7, 6, 5, 4, 3, 2, 1, 0); \ 53530 __ret_495 = __rev0_495 - __rev1_495 * __noswap_splatq_laneq_u16(__rev2_495, __p3_495); \ 53531 __ret_495 = __builtin_shufflevector(__ret_495, __ret_495, 7, 6, 5, 4, 3, 2, 1, 0); \ 53532 __ret_495; \ 53533 }) 53534 #endif 53535 53536 #ifdef __LITTLE_ENDIAN__ 53537 #define vmlsq_laneq_f32(__p0_496, __p1_496, __p2_496, __p3_496) __extension__ ({ \ 53538 float32x4_t __ret_496; \ 53539 float32x4_t __s0_496 = __p0_496; \ 53540 float32x4_t __s1_496 = __p1_496; \ 53541 float32x4_t __s2_496 = __p2_496; \ 53542 __ret_496 = __s0_496 - __s1_496 * splatq_laneq_f32(__s2_496, __p3_496); \ 53543 __ret_496; \ 53544 }) 53545 #else 53546 #define vmlsq_laneq_f32(__p0_497, __p1_497, __p2_497, __p3_497) __extension__ ({ \ 53547 float32x4_t __ret_497; \ 53548 float32x4_t __s0_497 = __p0_497; \ 53549 float32x4_t __s1_497 = __p1_497; \ 53550 float32x4_t __s2_497 = __p2_497; \ 53551 float32x4_t __rev0_497; __rev0_497 = __builtin_shufflevector(__s0_497, __s0_497, 3, 2, 1, 0); \ 53552 float32x4_t __rev1_497; __rev1_497 = __builtin_shufflevector(__s1_497, __s1_497, 3, 2, 1, 0); \ 53553 float32x4_t __rev2_497; __rev2_497 = __builtin_shufflevector(__s2_497, __s2_497, 3, 2, 1, 0); \ 53554 __ret_497 = __rev0_497 - __rev1_497 * __noswap_splatq_laneq_f32(__rev2_497, __p3_497); \ 53555 __ret_497 = __builtin_shufflevector(__ret_497, __ret_497, 3, 2, 1, 0); \ 53556 __ret_497; \ 53557 }) 53558 #endif 53559 
53560 #ifdef __LITTLE_ENDIAN__ 53561 #define vmlsq_laneq_s32(__p0_498, __p1_498, __p2_498, __p3_498) __extension__ ({ \ 53562 int32x4_t __ret_498; \ 53563 int32x4_t __s0_498 = __p0_498; \ 53564 int32x4_t __s1_498 = __p1_498; \ 53565 int32x4_t __s2_498 = __p2_498; \ 53566 __ret_498 = __s0_498 - __s1_498 * splatq_laneq_s32(__s2_498, __p3_498); \ 53567 __ret_498; \ 53568 }) 53569 #else 53570 #define vmlsq_laneq_s32(__p0_499, __p1_499, __p2_499, __p3_499) __extension__ ({ \ 53571 int32x4_t __ret_499; \ 53572 int32x4_t __s0_499 = __p0_499; \ 53573 int32x4_t __s1_499 = __p1_499; \ 53574 int32x4_t __s2_499 = __p2_499; \ 53575 int32x4_t __rev0_499; __rev0_499 = __builtin_shufflevector(__s0_499, __s0_499, 3, 2, 1, 0); \ 53576 int32x4_t __rev1_499; __rev1_499 = __builtin_shufflevector(__s1_499, __s1_499, 3, 2, 1, 0); \ 53577 int32x4_t __rev2_499; __rev2_499 = __builtin_shufflevector(__s2_499, __s2_499, 3, 2, 1, 0); \ 53578 __ret_499 = __rev0_499 - __rev1_499 * __noswap_splatq_laneq_s32(__rev2_499, __p3_499); \ 53579 __ret_499 = __builtin_shufflevector(__ret_499, __ret_499, 3, 2, 1, 0); \ 53580 __ret_499; \ 53581 }) 53582 #endif 53583 53584 #ifdef __LITTLE_ENDIAN__ 53585 #define vmlsq_laneq_s16(__p0_500, __p1_500, __p2_500, __p3_500) __extension__ ({ \ 53586 int16x8_t __ret_500; \ 53587 int16x8_t __s0_500 = __p0_500; \ 53588 int16x8_t __s1_500 = __p1_500; \ 53589 int16x8_t __s2_500 = __p2_500; \ 53590 __ret_500 = __s0_500 - __s1_500 * splatq_laneq_s16(__s2_500, __p3_500); \ 53591 __ret_500; \ 53592 }) 53593 #else 53594 #define vmlsq_laneq_s16(__p0_501, __p1_501, __p2_501, __p3_501) __extension__ ({ \ 53595 int16x8_t __ret_501; \ 53596 int16x8_t __s0_501 = __p0_501; \ 53597 int16x8_t __s1_501 = __p1_501; \ 53598 int16x8_t __s2_501 = __p2_501; \ 53599 int16x8_t __rev0_501; __rev0_501 = __builtin_shufflevector(__s0_501, __s0_501, 7, 6, 5, 4, 3, 2, 1, 0); \ 53600 int16x8_t __rev1_501; __rev1_501 = __builtin_shufflevector(__s1_501, __s1_501, 7, 6, 5, 4, 3, 2, 1, 0); \ 53601 
int16x8_t __rev2_501; __rev2_501 = __builtin_shufflevector(__s2_501, __s2_501, 7, 6, 5, 4, 3, 2, 1, 0); \ 53602 __ret_501 = __rev0_501 - __rev1_501 * __noswap_splatq_laneq_s16(__rev2_501, __p3_501); \ 53603 __ret_501 = __builtin_shufflevector(__ret_501, __ret_501, 7, 6, 5, 4, 3, 2, 1, 0); \ 53604 __ret_501; \ 53605 }) 53606 #endif 53607 53608 #ifdef __LITTLE_ENDIAN__ 53609 #define vmls_laneq_u32(__p0_502, __p1_502, __p2_502, __p3_502) __extension__ ({ \ 53610 uint32x2_t __ret_502; \ 53611 uint32x2_t __s0_502 = __p0_502; \ 53612 uint32x2_t __s1_502 = __p1_502; \ 53613 uint32x4_t __s2_502 = __p2_502; \ 53614 __ret_502 = __s0_502 - __s1_502 * splat_laneq_u32(__s2_502, __p3_502); \ 53615 __ret_502; \ 53616 }) 53617 #else 53618 #define vmls_laneq_u32(__p0_503, __p1_503, __p2_503, __p3_503) __extension__ ({ \ 53619 uint32x2_t __ret_503; \ 53620 uint32x2_t __s0_503 = __p0_503; \ 53621 uint32x2_t __s1_503 = __p1_503; \ 53622 uint32x4_t __s2_503 = __p2_503; \ 53623 uint32x2_t __rev0_503; __rev0_503 = __builtin_shufflevector(__s0_503, __s0_503, 1, 0); \ 53624 uint32x2_t __rev1_503; __rev1_503 = __builtin_shufflevector(__s1_503, __s1_503, 1, 0); \ 53625 uint32x4_t __rev2_503; __rev2_503 = __builtin_shufflevector(__s2_503, __s2_503, 3, 2, 1, 0); \ 53626 __ret_503 = __rev0_503 - __rev1_503 * __noswap_splat_laneq_u32(__rev2_503, __p3_503); \ 53627 __ret_503 = __builtin_shufflevector(__ret_503, __ret_503, 1, 0); \ 53628 __ret_503; \ 53629 }) 53630 #endif 53631 53632 #ifdef __LITTLE_ENDIAN__ 53633 #define vmls_laneq_u16(__p0_504, __p1_504, __p2_504, __p3_504) __extension__ ({ \ 53634 uint16x4_t __ret_504; \ 53635 uint16x4_t __s0_504 = __p0_504; \ 53636 uint16x4_t __s1_504 = __p1_504; \ 53637 uint16x8_t __s2_504 = __p2_504; \ 53638 __ret_504 = __s0_504 - __s1_504 * splat_laneq_u16(__s2_504, __p3_504); \ 53639 __ret_504; \ 53640 }) 53641 #else 53642 #define vmls_laneq_u16(__p0_505, __p1_505, __p2_505, __p3_505) __extension__ ({ \ 53643 uint16x4_t __ret_505; \ 53644 uint16x4_t 
__s0_505 = __p0_505; \ 53645 uint16x4_t __s1_505 = __p1_505; \ 53646 uint16x8_t __s2_505 = __p2_505; \ 53647 uint16x4_t __rev0_505; __rev0_505 = __builtin_shufflevector(__s0_505, __s0_505, 3, 2, 1, 0); \ 53648 uint16x4_t __rev1_505; __rev1_505 = __builtin_shufflevector(__s1_505, __s1_505, 3, 2, 1, 0); \ 53649 uint16x8_t __rev2_505; __rev2_505 = __builtin_shufflevector(__s2_505, __s2_505, 7, 6, 5, 4, 3, 2, 1, 0); \ 53650 __ret_505 = __rev0_505 - __rev1_505 * __noswap_splat_laneq_u16(__rev2_505, __p3_505); \ 53651 __ret_505 = __builtin_shufflevector(__ret_505, __ret_505, 3, 2, 1, 0); \ 53652 __ret_505; \ 53653 }) 53654 #endif 53655 53656 #ifdef __LITTLE_ENDIAN__ 53657 #define vmls_laneq_f32(__p0_506, __p1_506, __p2_506, __p3_506) __extension__ ({ \ 53658 float32x2_t __ret_506; \ 53659 float32x2_t __s0_506 = __p0_506; \ 53660 float32x2_t __s1_506 = __p1_506; \ 53661 float32x4_t __s2_506 = __p2_506; \ 53662 __ret_506 = __s0_506 - __s1_506 * splat_laneq_f32(__s2_506, __p3_506); \ 53663 __ret_506; \ 53664 }) 53665 #else 53666 #define vmls_laneq_f32(__p0_507, __p1_507, __p2_507, __p3_507) __extension__ ({ \ 53667 float32x2_t __ret_507; \ 53668 float32x2_t __s0_507 = __p0_507; \ 53669 float32x2_t __s1_507 = __p1_507; \ 53670 float32x4_t __s2_507 = __p2_507; \ 53671 float32x2_t __rev0_507; __rev0_507 = __builtin_shufflevector(__s0_507, __s0_507, 1, 0); \ 53672 float32x2_t __rev1_507; __rev1_507 = __builtin_shufflevector(__s1_507, __s1_507, 1, 0); \ 53673 float32x4_t __rev2_507; __rev2_507 = __builtin_shufflevector(__s2_507, __s2_507, 3, 2, 1, 0); \ 53674 __ret_507 = __rev0_507 - __rev1_507 * __noswap_splat_laneq_f32(__rev2_507, __p3_507); \ 53675 __ret_507 = __builtin_shufflevector(__ret_507, __ret_507, 1, 0); \ 53676 __ret_507; \ 53677 }) 53678 #endif 53679 53680 #ifdef __LITTLE_ENDIAN__ 53681 #define vmls_laneq_s32(__p0_508, __p1_508, __p2_508, __p3_508) __extension__ ({ \ 53682 int32x2_t __ret_508; \ 53683 int32x2_t __s0_508 = __p0_508; \ 53684 int32x2_t __s1_508 = 
__p1_508; \ 53685 int32x4_t __s2_508 = __p2_508; \ 53686 __ret_508 = __s0_508 - __s1_508 * splat_laneq_s32(__s2_508, __p3_508); \ 53687 __ret_508; \ 53688 }) 53689 #else 53690 #define vmls_laneq_s32(__p0_509, __p1_509, __p2_509, __p3_509) __extension__ ({ \ 53691 int32x2_t __ret_509; \ 53692 int32x2_t __s0_509 = __p0_509; \ 53693 int32x2_t __s1_509 = __p1_509; \ 53694 int32x4_t __s2_509 = __p2_509; \ 53695 int32x2_t __rev0_509; __rev0_509 = __builtin_shufflevector(__s0_509, __s0_509, 1, 0); \ 53696 int32x2_t __rev1_509; __rev1_509 = __builtin_shufflevector(__s1_509, __s1_509, 1, 0); \ 53697 int32x4_t __rev2_509; __rev2_509 = __builtin_shufflevector(__s2_509, __s2_509, 3, 2, 1, 0); \ 53698 __ret_509 = __rev0_509 - __rev1_509 * __noswap_splat_laneq_s32(__rev2_509, __p3_509); \ 53699 __ret_509 = __builtin_shufflevector(__ret_509, __ret_509, 1, 0); \ 53700 __ret_509; \ 53701 }) 53702 #endif 53703 53704 #ifdef __LITTLE_ENDIAN__ 53705 #define vmls_laneq_s16(__p0_510, __p1_510, __p2_510, __p3_510) __extension__ ({ \ 53706 int16x4_t __ret_510; \ 53707 int16x4_t __s0_510 = __p0_510; \ 53708 int16x4_t __s1_510 = __p1_510; \ 53709 int16x8_t __s2_510 = __p2_510; \ 53710 __ret_510 = __s0_510 - __s1_510 * splat_laneq_s16(__s2_510, __p3_510); \ 53711 __ret_510; \ 53712 }) 53713 #else 53714 #define vmls_laneq_s16(__p0_511, __p1_511, __p2_511, __p3_511) __extension__ ({ \ 53715 int16x4_t __ret_511; \ 53716 int16x4_t __s0_511 = __p0_511; \ 53717 int16x4_t __s1_511 = __p1_511; \ 53718 int16x8_t __s2_511 = __p2_511; \ 53719 int16x4_t __rev0_511; __rev0_511 = __builtin_shufflevector(__s0_511, __s0_511, 3, 2, 1, 0); \ 53720 int16x4_t __rev1_511; __rev1_511 = __builtin_shufflevector(__s1_511, __s1_511, 3, 2, 1, 0); \ 53721 int16x8_t __rev2_511; __rev2_511 = __builtin_shufflevector(__s2_511, __s2_511, 7, 6, 5, 4, 3, 2, 1, 0); \ 53722 __ret_511 = __rev0_511 - __rev1_511 * __noswap_splat_laneq_s16(__rev2_511, __p3_511); \ 53723 __ret_511 = __builtin_shufflevector(__ret_511, __ret_511, 3, 2, 
1, 0); \ 53724 __ret_511; \ 53725 }) 53726 #endif 53727 53728 #ifdef __LITTLE_ENDIAN__ 53729 #define vmlsl_high_lane_u32(__p0_512, __p1_512, __p2_512, __p3_512) __extension__ ({ \ 53730 uint64x2_t __ret_512; \ 53731 uint64x2_t __s0_512 = __p0_512; \ 53732 uint32x4_t __s1_512 = __p1_512; \ 53733 uint32x2_t __s2_512 = __p2_512; \ 53734 __ret_512 = __s0_512 - vmull_u32(vget_high_u32(__s1_512), splat_lane_u32(__s2_512, __p3_512)); \ 53735 __ret_512; \ 53736 }) 53737 #else 53738 #define vmlsl_high_lane_u32(__p0_513, __p1_513, __p2_513, __p3_513) __extension__ ({ \ 53739 uint64x2_t __ret_513; \ 53740 uint64x2_t __s0_513 = __p0_513; \ 53741 uint32x4_t __s1_513 = __p1_513; \ 53742 uint32x2_t __s2_513 = __p2_513; \ 53743 uint64x2_t __rev0_513; __rev0_513 = __builtin_shufflevector(__s0_513, __s0_513, 1, 0); \ 53744 uint32x4_t __rev1_513; __rev1_513 = __builtin_shufflevector(__s1_513, __s1_513, 3, 2, 1, 0); \ 53745 uint32x2_t __rev2_513; __rev2_513 = __builtin_shufflevector(__s2_513, __s2_513, 1, 0); \ 53746 __ret_513 = __rev0_513 - __noswap_vmull_u32(__noswap_vget_high_u32(__rev1_513), __noswap_splat_lane_u32(__rev2_513, __p3_513)); \ 53747 __ret_513 = __builtin_shufflevector(__ret_513, __ret_513, 1, 0); \ 53748 __ret_513; \ 53749 }) 53750 #endif 53751 53752 #ifdef __LITTLE_ENDIAN__ 53753 #define vmlsl_high_lane_u16(__p0_514, __p1_514, __p2_514, __p3_514) __extension__ ({ \ 53754 uint32x4_t __ret_514; \ 53755 uint32x4_t __s0_514 = __p0_514; \ 53756 uint16x8_t __s1_514 = __p1_514; \ 53757 uint16x4_t __s2_514 = __p2_514; \ 53758 __ret_514 = __s0_514 - vmull_u16(vget_high_u16(__s1_514), splat_lane_u16(__s2_514, __p3_514)); \ 53759 __ret_514; \ 53760 }) 53761 #else 53762 #define vmlsl_high_lane_u16(__p0_515, __p1_515, __p2_515, __p3_515) __extension__ ({ \ 53763 uint32x4_t __ret_515; \ 53764 uint32x4_t __s0_515 = __p0_515; \ 53765 uint16x8_t __s1_515 = __p1_515; \ 53766 uint16x4_t __s2_515 = __p2_515; \ 53767 uint32x4_t __rev0_515; __rev0_515 = __builtin_shufflevector(__s0_515, 
__s0_515, 3, 2, 1, 0); \ 53768 uint16x8_t __rev1_515; __rev1_515 = __builtin_shufflevector(__s1_515, __s1_515, 7, 6, 5, 4, 3, 2, 1, 0); \ 53769 uint16x4_t __rev2_515; __rev2_515 = __builtin_shufflevector(__s2_515, __s2_515, 3, 2, 1, 0); \ 53770 __ret_515 = __rev0_515 - __noswap_vmull_u16(__noswap_vget_high_u16(__rev1_515), __noswap_splat_lane_u16(__rev2_515, __p3_515)); \ 53771 __ret_515 = __builtin_shufflevector(__ret_515, __ret_515, 3, 2, 1, 0); \ 53772 __ret_515; \ 53773 }) 53774 #endif 53775 53776 #ifdef __LITTLE_ENDIAN__ 53777 #define vmlsl_high_lane_s32(__p0_516, __p1_516, __p2_516, __p3_516) __extension__ ({ \ 53778 int64x2_t __ret_516; \ 53779 int64x2_t __s0_516 = __p0_516; \ 53780 int32x4_t __s1_516 = __p1_516; \ 53781 int32x2_t __s2_516 = __p2_516; \ 53782 __ret_516 = __s0_516 - vmull_s32(vget_high_s32(__s1_516), splat_lane_s32(__s2_516, __p3_516)); \ 53783 __ret_516; \ 53784 }) 53785 #else 53786 #define vmlsl_high_lane_s32(__p0_517, __p1_517, __p2_517, __p3_517) __extension__ ({ \ 53787 int64x2_t __ret_517; \ 53788 int64x2_t __s0_517 = __p0_517; \ 53789 int32x4_t __s1_517 = __p1_517; \ 53790 int32x2_t __s2_517 = __p2_517; \ 53791 int64x2_t __rev0_517; __rev0_517 = __builtin_shufflevector(__s0_517, __s0_517, 1, 0); \ 53792 int32x4_t __rev1_517; __rev1_517 = __builtin_shufflevector(__s1_517, __s1_517, 3, 2, 1, 0); \ 53793 int32x2_t __rev2_517; __rev2_517 = __builtin_shufflevector(__s2_517, __s2_517, 1, 0); \ 53794 __ret_517 = __rev0_517 - __noswap_vmull_s32(__noswap_vget_high_s32(__rev1_517), __noswap_splat_lane_s32(__rev2_517, __p3_517)); \ 53795 __ret_517 = __builtin_shufflevector(__ret_517, __ret_517, 1, 0); \ 53796 __ret_517; \ 53797 }) 53798 #endif 53799 53800 #ifdef __LITTLE_ENDIAN__ 53801 #define vmlsl_high_lane_s16(__p0_518, __p1_518, __p2_518, __p3_518) __extension__ ({ \ 53802 int32x4_t __ret_518; \ 53803 int32x4_t __s0_518 = __p0_518; \ 53804 int16x8_t __s1_518 = __p1_518; \ 53805 int16x4_t __s2_518 = __p2_518; \ 53806 __ret_518 = __s0_518 - 
vmull_s16(vget_high_s16(__s1_518), splat_lane_s16(__s2_518, __p3_518)); \ 53807 __ret_518; \ 53808 }) 53809 #else 53810 #define vmlsl_high_lane_s16(__p0_519, __p1_519, __p2_519, __p3_519) __extension__ ({ \ 53811 int32x4_t __ret_519; \ 53812 int32x4_t __s0_519 = __p0_519; \ 53813 int16x8_t __s1_519 = __p1_519; \ 53814 int16x4_t __s2_519 = __p2_519; \ 53815 int32x4_t __rev0_519; __rev0_519 = __builtin_shufflevector(__s0_519, __s0_519, 3, 2, 1, 0); \ 53816 int16x8_t __rev1_519; __rev1_519 = __builtin_shufflevector(__s1_519, __s1_519, 7, 6, 5, 4, 3, 2, 1, 0); \ 53817 int16x4_t __rev2_519; __rev2_519 = __builtin_shufflevector(__s2_519, __s2_519, 3, 2, 1, 0); \ 53818 __ret_519 = __rev0_519 - __noswap_vmull_s16(__noswap_vget_high_s16(__rev1_519), __noswap_splat_lane_s16(__rev2_519, __p3_519)); \ 53819 __ret_519 = __builtin_shufflevector(__ret_519, __ret_519, 3, 2, 1, 0); \ 53820 __ret_519; \ 53821 }) 53822 #endif 53823 53824 #ifdef __LITTLE_ENDIAN__ 53825 #define vmlsl_high_laneq_u32(__p0_520, __p1_520, __p2_520, __p3_520) __extension__ ({ \ 53826 uint64x2_t __ret_520; \ 53827 uint64x2_t __s0_520 = __p0_520; \ 53828 uint32x4_t __s1_520 = __p1_520; \ 53829 uint32x4_t __s2_520 = __p2_520; \ 53830 __ret_520 = __s0_520 - vmull_u32(vget_high_u32(__s1_520), splat_laneq_u32(__s2_520, __p3_520)); \ 53831 __ret_520; \ 53832 }) 53833 #else 53834 #define vmlsl_high_laneq_u32(__p0_521, __p1_521, __p2_521, __p3_521) __extension__ ({ \ 53835 uint64x2_t __ret_521; \ 53836 uint64x2_t __s0_521 = __p0_521; \ 53837 uint32x4_t __s1_521 = __p1_521; \ 53838 uint32x4_t __s2_521 = __p2_521; \ 53839 uint64x2_t __rev0_521; __rev0_521 = __builtin_shufflevector(__s0_521, __s0_521, 1, 0); \ 53840 uint32x4_t __rev1_521; __rev1_521 = __builtin_shufflevector(__s1_521, __s1_521, 3, 2, 1, 0); \ 53841 uint32x4_t __rev2_521; __rev2_521 = __builtin_shufflevector(__s2_521, __s2_521, 3, 2, 1, 0); \ 53842 __ret_521 = __rev0_521 - __noswap_vmull_u32(__noswap_vget_high_u32(__rev1_521), 
__noswap_splat_laneq_u32(__rev2_521, __p3_521)); \ 53843 __ret_521 = __builtin_shufflevector(__ret_521, __ret_521, 1, 0); \ 53844 __ret_521; \ 53845 }) 53846 #endif 53847 53848 #ifdef __LITTLE_ENDIAN__ 53849 #define vmlsl_high_laneq_u16(__p0_522, __p1_522, __p2_522, __p3_522) __extension__ ({ \ 53850 uint32x4_t __ret_522; \ 53851 uint32x4_t __s0_522 = __p0_522; \ 53852 uint16x8_t __s1_522 = __p1_522; \ 53853 uint16x8_t __s2_522 = __p2_522; \ 53854 __ret_522 = __s0_522 - vmull_u16(vget_high_u16(__s1_522), splat_laneq_u16(__s2_522, __p3_522)); \ 53855 __ret_522; \ 53856 }) 53857 #else 53858 #define vmlsl_high_laneq_u16(__p0_523, __p1_523, __p2_523, __p3_523) __extension__ ({ \ 53859 uint32x4_t __ret_523; \ 53860 uint32x4_t __s0_523 = __p0_523; \ 53861 uint16x8_t __s1_523 = __p1_523; \ 53862 uint16x8_t __s2_523 = __p2_523; \ 53863 uint32x4_t __rev0_523; __rev0_523 = __builtin_shufflevector(__s0_523, __s0_523, 3, 2, 1, 0); \ 53864 uint16x8_t __rev1_523; __rev1_523 = __builtin_shufflevector(__s1_523, __s1_523, 7, 6, 5, 4, 3, 2, 1, 0); \ 53865 uint16x8_t __rev2_523; __rev2_523 = __builtin_shufflevector(__s2_523, __s2_523, 7, 6, 5, 4, 3, 2, 1, 0); \ 53866 __ret_523 = __rev0_523 - __noswap_vmull_u16(__noswap_vget_high_u16(__rev1_523), __noswap_splat_laneq_u16(__rev2_523, __p3_523)); \ 53867 __ret_523 = __builtin_shufflevector(__ret_523, __ret_523, 3, 2, 1, 0); \ 53868 __ret_523; \ 53869 }) 53870 #endif 53871 53872 #ifdef __LITTLE_ENDIAN__ 53873 #define vmlsl_high_laneq_s32(__p0_524, __p1_524, __p2_524, __p3_524) __extension__ ({ \ 53874 int64x2_t __ret_524; \ 53875 int64x2_t __s0_524 = __p0_524; \ 53876 int32x4_t __s1_524 = __p1_524; \ 53877 int32x4_t __s2_524 = __p2_524; \ 53878 __ret_524 = __s0_524 - vmull_s32(vget_high_s32(__s1_524), splat_laneq_s32(__s2_524, __p3_524)); \ 53879 __ret_524; \ 53880 }) 53881 #else 53882 #define vmlsl_high_laneq_s32(__p0_525, __p1_525, __p2_525, __p3_525) __extension__ ({ \ 53883 int64x2_t __ret_525; \ 53884 int64x2_t __s0_525 = __p0_525; 
\ 53885 int32x4_t __s1_525 = __p1_525; \ 53886 int32x4_t __s2_525 = __p2_525; \ 53887 int64x2_t __rev0_525; __rev0_525 = __builtin_shufflevector(__s0_525, __s0_525, 1, 0); \ 53888 int32x4_t __rev1_525; __rev1_525 = __builtin_shufflevector(__s1_525, __s1_525, 3, 2, 1, 0); \ 53889 int32x4_t __rev2_525; __rev2_525 = __builtin_shufflevector(__s2_525, __s2_525, 3, 2, 1, 0); \ 53890 __ret_525 = __rev0_525 - __noswap_vmull_s32(__noswap_vget_high_s32(__rev1_525), __noswap_splat_laneq_s32(__rev2_525, __p3_525)); \ 53891 __ret_525 = __builtin_shufflevector(__ret_525, __ret_525, 1, 0); \ 53892 __ret_525; \ 53893 }) 53894 #endif 53895 53896 #ifdef __LITTLE_ENDIAN__ 53897 #define vmlsl_high_laneq_s16(__p0_526, __p1_526, __p2_526, __p3_526) __extension__ ({ \ 53898 int32x4_t __ret_526; \ 53899 int32x4_t __s0_526 = __p0_526; \ 53900 int16x8_t __s1_526 = __p1_526; \ 53901 int16x8_t __s2_526 = __p2_526; \ 53902 __ret_526 = __s0_526 - vmull_s16(vget_high_s16(__s1_526), splat_laneq_s16(__s2_526, __p3_526)); \ 53903 __ret_526; \ 53904 }) 53905 #else 53906 #define vmlsl_high_laneq_s16(__p0_527, __p1_527, __p2_527, __p3_527) __extension__ ({ \ 53907 int32x4_t __ret_527; \ 53908 int32x4_t __s0_527 = __p0_527; \ 53909 int16x8_t __s1_527 = __p1_527; \ 53910 int16x8_t __s2_527 = __p2_527; \ 53911 int32x4_t __rev0_527; __rev0_527 = __builtin_shufflevector(__s0_527, __s0_527, 3, 2, 1, 0); \ 53912 int16x8_t __rev1_527; __rev1_527 = __builtin_shufflevector(__s1_527, __s1_527, 7, 6, 5, 4, 3, 2, 1, 0); \ 53913 int16x8_t __rev2_527; __rev2_527 = __builtin_shufflevector(__s2_527, __s2_527, 7, 6, 5, 4, 3, 2, 1, 0); \ 53914 __ret_527 = __rev0_527 - __noswap_vmull_s16(__noswap_vget_high_s16(__rev1_527), __noswap_splat_laneq_s16(__rev2_527, __p3_527)); \ 53915 __ret_527 = __builtin_shufflevector(__ret_527, __ret_527, 3, 2, 1, 0); \ 53916 __ret_527; \ 53917 }) 53918 #endif 53919 53920 #ifdef __LITTLE_ENDIAN__ 53921 #define vmlsl_laneq_u32(__p0_528, __p1_528, __p2_528, __p3_528) __extension__ ({ \ 53922 
uint64x2_t __ret_528; \ 53923 uint64x2_t __s0_528 = __p0_528; \ 53924 uint32x2_t __s1_528 = __p1_528; \ 53925 uint32x4_t __s2_528 = __p2_528; \ 53926 __ret_528 = __s0_528 - vmull_u32(__s1_528, splat_laneq_u32(__s2_528, __p3_528)); \ 53927 __ret_528; \ 53928 }) 53929 #else 53930 #define vmlsl_laneq_u32(__p0_529, __p1_529, __p2_529, __p3_529) __extension__ ({ \ 53931 uint64x2_t __ret_529; \ 53932 uint64x2_t __s0_529 = __p0_529; \ 53933 uint32x2_t __s1_529 = __p1_529; \ 53934 uint32x4_t __s2_529 = __p2_529; \ 53935 uint64x2_t __rev0_529; __rev0_529 = __builtin_shufflevector(__s0_529, __s0_529, 1, 0); \ 53936 uint32x2_t __rev1_529; __rev1_529 = __builtin_shufflevector(__s1_529, __s1_529, 1, 0); \ 53937 uint32x4_t __rev2_529; __rev2_529 = __builtin_shufflevector(__s2_529, __s2_529, 3, 2, 1, 0); \ 53938 __ret_529 = __rev0_529 - __noswap_vmull_u32(__rev1_529, __noswap_splat_laneq_u32(__rev2_529, __p3_529)); \ 53939 __ret_529 = __builtin_shufflevector(__ret_529, __ret_529, 1, 0); \ 53940 __ret_529; \ 53941 }) 53942 #endif 53943 53944 #ifdef __LITTLE_ENDIAN__ 53945 #define vmlsl_laneq_u16(__p0_530, __p1_530, __p2_530, __p3_530) __extension__ ({ \ 53946 uint32x4_t __ret_530; \ 53947 uint32x4_t __s0_530 = __p0_530; \ 53948 uint16x4_t __s1_530 = __p1_530; \ 53949 uint16x8_t __s2_530 = __p2_530; \ 53950 __ret_530 = __s0_530 - vmull_u16(__s1_530, splat_laneq_u16(__s2_530, __p3_530)); \ 53951 __ret_530; \ 53952 }) 53953 #else 53954 #define vmlsl_laneq_u16(__p0_531, __p1_531, __p2_531, __p3_531) __extension__ ({ \ 53955 uint32x4_t __ret_531; \ 53956 uint32x4_t __s0_531 = __p0_531; \ 53957 uint16x4_t __s1_531 = __p1_531; \ 53958 uint16x8_t __s2_531 = __p2_531; \ 53959 uint32x4_t __rev0_531; __rev0_531 = __builtin_shufflevector(__s0_531, __s0_531, 3, 2, 1, 0); \ 53960 uint16x4_t __rev1_531; __rev1_531 = __builtin_shufflevector(__s1_531, __s1_531, 3, 2, 1, 0); \ 53961 uint16x8_t __rev2_531; __rev2_531 = __builtin_shufflevector(__s2_531, __s2_531, 7, 6, 5, 4, 3, 2, 1, 0); \ 53962 
__ret_531 = __rev0_531 - __noswap_vmull_u16(__rev1_531, __noswap_splat_laneq_u16(__rev2_531, __p3_531)); \ 53963 __ret_531 = __builtin_shufflevector(__ret_531, __ret_531, 3, 2, 1, 0); \ 53964 __ret_531; \ 53965 }) 53966 #endif 53967 53968 #ifdef __LITTLE_ENDIAN__ 53969 #define vmlsl_laneq_s32(__p0_532, __p1_532, __p2_532, __p3_532) __extension__ ({ \ 53970 int64x2_t __ret_532; \ 53971 int64x2_t __s0_532 = __p0_532; \ 53972 int32x2_t __s1_532 = __p1_532; \ 53973 int32x4_t __s2_532 = __p2_532; \ 53974 __ret_532 = __s0_532 - vmull_s32(__s1_532, splat_laneq_s32(__s2_532, __p3_532)); \ 53975 __ret_532; \ 53976 }) 53977 #else 53978 #define vmlsl_laneq_s32(__p0_533, __p1_533, __p2_533, __p3_533) __extension__ ({ \ 53979 int64x2_t __ret_533; \ 53980 int64x2_t __s0_533 = __p0_533; \ 53981 int32x2_t __s1_533 = __p1_533; \ 53982 int32x4_t __s2_533 = __p2_533; \ 53983 int64x2_t __rev0_533; __rev0_533 = __builtin_shufflevector(__s0_533, __s0_533, 1, 0); \ 53984 int32x2_t __rev1_533; __rev1_533 = __builtin_shufflevector(__s1_533, __s1_533, 1, 0); \ 53985 int32x4_t __rev2_533; __rev2_533 = __builtin_shufflevector(__s2_533, __s2_533, 3, 2, 1, 0); \ 53986 __ret_533 = __rev0_533 - __noswap_vmull_s32(__rev1_533, __noswap_splat_laneq_s32(__rev2_533, __p3_533)); \ 53987 __ret_533 = __builtin_shufflevector(__ret_533, __ret_533, 1, 0); \ 53988 __ret_533; \ 53989 }) 53990 #endif 53991 53992 #ifdef __LITTLE_ENDIAN__ 53993 #define vmlsl_laneq_s16(__p0_534, __p1_534, __p2_534, __p3_534) __extension__ ({ \ 53994 int32x4_t __ret_534; \ 53995 int32x4_t __s0_534 = __p0_534; \ 53996 int16x4_t __s1_534 = __p1_534; \ 53997 int16x8_t __s2_534 = __p2_534; \ 53998 __ret_534 = __s0_534 - vmull_s16(__s1_534, splat_laneq_s16(__s2_534, __p3_534)); \ 53999 __ret_534; \ 54000 }) 54001 #else 54002 #define vmlsl_laneq_s16(__p0_535, __p1_535, __p2_535, __p3_535) __extension__ ({ \ 54003 int32x4_t __ret_535; \ 54004 int32x4_t __s0_535 = __p0_535; \ 54005 int16x4_t __s1_535 = __p1_535; \ 54006 int16x8_t __s2_535 
= __p2_535; \ 54007 int32x4_t __rev0_535; __rev0_535 = __builtin_shufflevector(__s0_535, __s0_535, 3, 2, 1, 0); \ 54008 int16x4_t __rev1_535; __rev1_535 = __builtin_shufflevector(__s1_535, __s1_535, 3, 2, 1, 0); \ 54009 int16x8_t __rev2_535; __rev2_535 = __builtin_shufflevector(__s2_535, __s2_535, 7, 6, 5, 4, 3, 2, 1, 0); \ 54010 __ret_535 = __rev0_535 - __noswap_vmull_s16(__rev1_535, __noswap_splat_laneq_s16(__rev2_535, __p3_535)); \ 54011 __ret_535 = __builtin_shufflevector(__ret_535, __ret_535, 3, 2, 1, 0); \ 54012 __ret_535; \ 54013 }) 54014 #endif 54015 54016 __ai __attribute__((target("neon"))) poly64x1_t vmov_n_p64(poly64_t __p0) { 54017 poly64x1_t __ret; 54018 __ret = (poly64x1_t) {__p0}; 54019 return __ret; 54020 } 54021 #ifdef __LITTLE_ENDIAN__ 54022 __ai __attribute__((target("neon"))) poly64x2_t vmovq_n_p64(poly64_t __p0) { 54023 poly64x2_t __ret; 54024 __ret = (poly64x2_t) {__p0, __p0}; 54025 return __ret; 54026 } 54027 #else 54028 __ai __attribute__((target("neon"))) poly64x2_t vmovq_n_p64(poly64_t __p0) { 54029 poly64x2_t __ret; 54030 __ret = (poly64x2_t) {__p0, __p0}; 54031 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 54032 return __ret; 54033 } 54034 #endif 54035 54036 #ifdef __LITTLE_ENDIAN__ 54037 __ai __attribute__((target("neon"))) float64x2_t vmovq_n_f64(float64_t __p0) { 54038 float64x2_t __ret; 54039 __ret = (float64x2_t) {__p0, __p0}; 54040 return __ret; 54041 } 54042 #else 54043 __ai __attribute__((target("neon"))) float64x2_t vmovq_n_f64(float64_t __p0) { 54044 float64x2_t __ret; 54045 __ret = (float64x2_t) {__p0, __p0}; 54046 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 54047 return __ret; 54048 } 54049 #endif 54050 54051 __ai __attribute__((target("neon"))) float64x1_t vmov_n_f64(float64_t __p0) { 54052 float64x1_t __ret; 54053 __ret = (float64x1_t) {__p0}; 54054 return __ret; 54055 } 54056 #ifdef __LITTLE_ENDIAN__ 54057 __ai __attribute__((target("neon"))) uint16x8_t vmovl_high_u8(uint8x16_t __p0_536) { 54058 uint16x8_t 
__ret_536; 54059 uint8x8_t __a1_536 = vget_high_u8(__p0_536); 54060 __ret_536 = (uint16x8_t)(vshll_n_u8(__a1_536, 0)); 54061 return __ret_536; 54062 } 54063 #else 54064 __ai __attribute__((target("neon"))) uint16x8_t vmovl_high_u8(uint8x16_t __p0_537) { 54065 uint16x8_t __ret_537; 54066 uint8x16_t __rev0_537; __rev0_537 = __builtin_shufflevector(__p0_537, __p0_537, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54067 uint8x8_t __a1_537 = __noswap_vget_high_u8(__rev0_537); 54068 __ret_537 = (uint16x8_t)(__noswap_vshll_n_u8(__a1_537, 0)); 54069 __ret_537 = __builtin_shufflevector(__ret_537, __ret_537, 7, 6, 5, 4, 3, 2, 1, 0); 54070 return __ret_537; 54071 } 54072 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmovl_high_u8(uint8x16_t __p0_538) { 54073 uint16x8_t __ret_538; 54074 uint8x8_t __a1_538 = __noswap_vget_high_u8(__p0_538); 54075 __ret_538 = (uint16x8_t)(__noswap_vshll_n_u8(__a1_538, 0)); 54076 return __ret_538; 54077 } 54078 #endif 54079 54080 #ifdef __LITTLE_ENDIAN__ 54081 __ai __attribute__((target("neon"))) uint64x2_t vmovl_high_u32(uint32x4_t __p0_539) { 54082 uint64x2_t __ret_539; 54083 uint32x2_t __a1_539 = vget_high_u32(__p0_539); 54084 __ret_539 = (uint64x2_t)(vshll_n_u32(__a1_539, 0)); 54085 return __ret_539; 54086 } 54087 #else 54088 __ai __attribute__((target("neon"))) uint64x2_t vmovl_high_u32(uint32x4_t __p0_540) { 54089 uint64x2_t __ret_540; 54090 uint32x4_t __rev0_540; __rev0_540 = __builtin_shufflevector(__p0_540, __p0_540, 3, 2, 1, 0); 54091 uint32x2_t __a1_540 = __noswap_vget_high_u32(__rev0_540); 54092 __ret_540 = (uint64x2_t)(__noswap_vshll_n_u32(__a1_540, 0)); 54093 __ret_540 = __builtin_shufflevector(__ret_540, __ret_540, 1, 0); 54094 return __ret_540; 54095 } 54096 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmovl_high_u32(uint32x4_t __p0_541) { 54097 uint64x2_t __ret_541; 54098 uint32x2_t __a1_541 = __noswap_vget_high_u32(__p0_541); 54099 __ret_541 = (uint64x2_t)(__noswap_vshll_n_u32(__a1_541, 0)); 54100 
return __ret_541; 54101 } 54102 #endif 54103 54104 #ifdef __LITTLE_ENDIAN__ 54105 __ai __attribute__((target("neon"))) uint32x4_t vmovl_high_u16(uint16x8_t __p0_542) { 54106 uint32x4_t __ret_542; 54107 uint16x4_t __a1_542 = vget_high_u16(__p0_542); 54108 __ret_542 = (uint32x4_t)(vshll_n_u16(__a1_542, 0)); 54109 return __ret_542; 54110 } 54111 #else 54112 __ai __attribute__((target("neon"))) uint32x4_t vmovl_high_u16(uint16x8_t __p0_543) { 54113 uint32x4_t __ret_543; 54114 uint16x8_t __rev0_543; __rev0_543 = __builtin_shufflevector(__p0_543, __p0_543, 7, 6, 5, 4, 3, 2, 1, 0); 54115 uint16x4_t __a1_543 = __noswap_vget_high_u16(__rev0_543); 54116 __ret_543 = (uint32x4_t)(__noswap_vshll_n_u16(__a1_543, 0)); 54117 __ret_543 = __builtin_shufflevector(__ret_543, __ret_543, 3, 2, 1, 0); 54118 return __ret_543; 54119 } 54120 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmovl_high_u16(uint16x8_t __p0_544) { 54121 uint32x4_t __ret_544; 54122 uint16x4_t __a1_544 = __noswap_vget_high_u16(__p0_544); 54123 __ret_544 = (uint32x4_t)(__noswap_vshll_n_u16(__a1_544, 0)); 54124 return __ret_544; 54125 } 54126 #endif 54127 54128 #ifdef __LITTLE_ENDIAN__ 54129 __ai __attribute__((target("neon"))) int16x8_t vmovl_high_s8(int8x16_t __p0_545) { 54130 int16x8_t __ret_545; 54131 int8x8_t __a1_545 = vget_high_s8(__p0_545); 54132 __ret_545 = (int16x8_t)(vshll_n_s8(__a1_545, 0)); 54133 return __ret_545; 54134 } 54135 #else 54136 __ai __attribute__((target("neon"))) int16x8_t vmovl_high_s8(int8x16_t __p0_546) { 54137 int16x8_t __ret_546; 54138 int8x16_t __rev0_546; __rev0_546 = __builtin_shufflevector(__p0_546, __p0_546, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54139 int8x8_t __a1_546 = __noswap_vget_high_s8(__rev0_546); 54140 __ret_546 = (int16x8_t)(__noswap_vshll_n_s8(__a1_546, 0)); 54141 __ret_546 = __builtin_shufflevector(__ret_546, __ret_546, 7, 6, 5, 4, 3, 2, 1, 0); 54142 return __ret_546; 54143 } 54144 __ai __attribute__((target("neon"))) int16x8_t 
__noswap_vmovl_high_s8(int8x16_t __p0_547) { 54145 int16x8_t __ret_547; 54146 int8x8_t __a1_547 = __noswap_vget_high_s8(__p0_547); 54147 __ret_547 = (int16x8_t)(__noswap_vshll_n_s8(__a1_547, 0)); 54148 return __ret_547; 54149 } 54150 #endif 54151 54152 #ifdef __LITTLE_ENDIAN__ 54153 __ai __attribute__((target("neon"))) int64x2_t vmovl_high_s32(int32x4_t __p0_548) { 54154 int64x2_t __ret_548; 54155 int32x2_t __a1_548 = vget_high_s32(__p0_548); 54156 __ret_548 = (int64x2_t)(vshll_n_s32(__a1_548, 0)); 54157 return __ret_548; 54158 } 54159 #else 54160 __ai __attribute__((target("neon"))) int64x2_t vmovl_high_s32(int32x4_t __p0_549) { 54161 int64x2_t __ret_549; 54162 int32x4_t __rev0_549; __rev0_549 = __builtin_shufflevector(__p0_549, __p0_549, 3, 2, 1, 0); 54163 int32x2_t __a1_549 = __noswap_vget_high_s32(__rev0_549); 54164 __ret_549 = (int64x2_t)(__noswap_vshll_n_s32(__a1_549, 0)); 54165 __ret_549 = __builtin_shufflevector(__ret_549, __ret_549, 1, 0); 54166 return __ret_549; 54167 } 54168 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmovl_high_s32(int32x4_t __p0_550) { 54169 int64x2_t __ret_550; 54170 int32x2_t __a1_550 = __noswap_vget_high_s32(__p0_550); 54171 __ret_550 = (int64x2_t)(__noswap_vshll_n_s32(__a1_550, 0)); 54172 return __ret_550; 54173 } 54174 #endif 54175 54176 #ifdef __LITTLE_ENDIAN__ 54177 __ai __attribute__((target("neon"))) int32x4_t vmovl_high_s16(int16x8_t __p0_551) { 54178 int32x4_t __ret_551; 54179 int16x4_t __a1_551 = vget_high_s16(__p0_551); 54180 __ret_551 = (int32x4_t)(vshll_n_s16(__a1_551, 0)); 54181 return __ret_551; 54182 } 54183 #else 54184 __ai __attribute__((target("neon"))) int32x4_t vmovl_high_s16(int16x8_t __p0_552) { 54185 int32x4_t __ret_552; 54186 int16x8_t __rev0_552; __rev0_552 = __builtin_shufflevector(__p0_552, __p0_552, 7, 6, 5, 4, 3, 2, 1, 0); 54187 int16x4_t __a1_552 = __noswap_vget_high_s16(__rev0_552); 54188 __ret_552 = (int32x4_t)(__noswap_vshll_n_s16(__a1_552, 0)); 54189 __ret_552 = 
__builtin_shufflevector(__ret_552, __ret_552, 3, 2, 1, 0); 54190 return __ret_552; 54191 } 54192 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmovl_high_s16(int16x8_t __p0_553) { 54193 int32x4_t __ret_553; 54194 int16x4_t __a1_553 = __noswap_vget_high_s16(__p0_553); 54195 __ret_553 = (int32x4_t)(__noswap_vshll_n_s16(__a1_553, 0)); 54196 return __ret_553; 54197 } 54198 #endif 54199 54200 #ifdef __LITTLE_ENDIAN__ 54201 __ai __attribute__((target("neon"))) uint16x8_t vmovn_high_u32(uint16x4_t __p0, uint32x4_t __p1) { 54202 uint16x8_t __ret; 54203 __ret = vcombine_u16(__p0, vmovn_u32(__p1)); 54204 return __ret; 54205 } 54206 #else 54207 __ai __attribute__((target("neon"))) uint16x8_t vmovn_high_u32(uint16x4_t __p0, uint32x4_t __p1) { 54208 uint16x8_t __ret; 54209 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 54210 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 54211 __ret = __noswap_vcombine_u16(__rev0, __noswap_vmovn_u32(__rev1)); 54212 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 54213 return __ret; 54214 } 54215 #endif 54216 54217 #ifdef __LITTLE_ENDIAN__ 54218 __ai __attribute__((target("neon"))) uint32x4_t vmovn_high_u64(uint32x2_t __p0, uint64x2_t __p1) { 54219 uint32x4_t __ret; 54220 __ret = vcombine_u32(__p0, vmovn_u64(__p1)); 54221 return __ret; 54222 } 54223 #else 54224 __ai __attribute__((target("neon"))) uint32x4_t vmovn_high_u64(uint32x2_t __p0, uint64x2_t __p1) { 54225 uint32x4_t __ret; 54226 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 54227 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 54228 __ret = __noswap_vcombine_u32(__rev0, __noswap_vmovn_u64(__rev1)); 54229 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 54230 return __ret; 54231 } 54232 #endif 54233 54234 #ifdef __LITTLE_ENDIAN__ 54235 __ai __attribute__((target("neon"))) uint8x16_t vmovn_high_u16(uint8x8_t __p0, uint16x8_t __p1) { 54236 
uint8x16_t __ret; 54237 __ret = vcombine_u8(__p0, vmovn_u16(__p1)); 54238 return __ret; 54239 } 54240 #else 54241 __ai __attribute__((target("neon"))) uint8x16_t vmovn_high_u16(uint8x8_t __p0, uint16x8_t __p1) { 54242 uint8x16_t __ret; 54243 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 54244 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 54245 __ret = __noswap_vcombine_u8(__rev0, __noswap_vmovn_u16(__rev1)); 54246 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54247 return __ret; 54248 } 54249 #endif 54250 54251 #ifdef __LITTLE_ENDIAN__ 54252 __ai __attribute__((target("neon"))) int16x8_t vmovn_high_s32(int16x4_t __p0, int32x4_t __p1) { 54253 int16x8_t __ret; 54254 __ret = vcombine_s16(__p0, vmovn_s32(__p1)); 54255 return __ret; 54256 } 54257 #else 54258 __ai __attribute__((target("neon"))) int16x8_t vmovn_high_s32(int16x4_t __p0, int32x4_t __p1) { 54259 int16x8_t __ret; 54260 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 54261 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 54262 __ret = __noswap_vcombine_s16(__rev0, __noswap_vmovn_s32(__rev1)); 54263 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 54264 return __ret; 54265 } 54266 #endif 54267 54268 #ifdef __LITTLE_ENDIAN__ 54269 __ai __attribute__((target("neon"))) int32x4_t vmovn_high_s64(int32x2_t __p0, int64x2_t __p1) { 54270 int32x4_t __ret; 54271 __ret = vcombine_s32(__p0, vmovn_s64(__p1)); 54272 return __ret; 54273 } 54274 #else 54275 __ai __attribute__((target("neon"))) int32x4_t vmovn_high_s64(int32x2_t __p0, int64x2_t __p1) { 54276 int32x4_t __ret; 54277 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 54278 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 54279 __ret = __noswap_vcombine_s32(__rev0, __noswap_vmovn_s64(__rev1)); 54280 __ret = 
__builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 54281 return __ret; 54282 } 54283 #endif 54284 54285 #ifdef __LITTLE_ENDIAN__ 54286 __ai __attribute__((target("neon"))) int8x16_t vmovn_high_s16(int8x8_t __p0, int16x8_t __p1) { 54287 int8x16_t __ret; 54288 __ret = vcombine_s8(__p0, vmovn_s16(__p1)); 54289 return __ret; 54290 } 54291 #else 54292 __ai __attribute__((target("neon"))) int8x16_t vmovn_high_s16(int8x8_t __p0, int16x8_t __p1) { 54293 int8x16_t __ret; 54294 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 54295 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 54296 __ret = __noswap_vcombine_s8(__rev0, __noswap_vmovn_s16(__rev1)); 54297 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54298 return __ret; 54299 } 54300 #endif 54301 54302 #ifdef __LITTLE_ENDIAN__ 54303 __ai __attribute__((target("neon"))) float64x2_t vmulq_f64(float64x2_t __p0, float64x2_t __p1) { 54304 float64x2_t __ret; 54305 __ret = __p0 * __p1; 54306 return __ret; 54307 } 54308 #else 54309 __ai __attribute__((target("neon"))) float64x2_t vmulq_f64(float64x2_t __p0, float64x2_t __p1) { 54310 float64x2_t __ret; 54311 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 54312 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 54313 __ret = __rev0 * __rev1; 54314 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 54315 return __ret; 54316 } 54317 #endif 54318 54319 __ai __attribute__((target("neon"))) float64x1_t vmul_f64(float64x1_t __p0, float64x1_t __p1) { 54320 float64x1_t __ret; 54321 __ret = __p0 * __p1; 54322 return __ret; 54323 } 54324 #define vmuld_lane_f64(__p0_554, __p1_554, __p2_554) __extension__ ({ \ 54325 float64_t __ret_554; \ 54326 float64_t __s0_554 = __p0_554; \ 54327 float64x1_t __s1_554 = __p1_554; \ 54328 __ret_554 = __s0_554 * vget_lane_f64(__s1_554, __p2_554); \ 54329 __ret_554; \ 54330 }) 54331 
/* vmuls_lane_f32(s, v, lane): yields s * vget_lane_f32(v, lane). The #else (big-endian) variant first lane-reverses v with __builtin_shufflevector and reads the lane through __noswap_vget_lane_f32. */ #ifdef __LITTLE_ENDIAN__ 54332 #define vmuls_lane_f32(__p0_555, __p1_555, __p2_555) __extension__ ({ \ 54333 float32_t __ret_555; \ 54334 float32_t __s0_555 = __p0_555; \ 54335 float32x2_t __s1_555 = __p1_555; \ 54336 __ret_555 = __s0_555 * vget_lane_f32(__s1_555, __p2_555); \ 54337 __ret_555; \ 54338 }) 54339 #else 54340 #define vmuls_lane_f32(__p0_556, __p1_556, __p2_556) __extension__ ({ \ 54341 float32_t __ret_556; \ 54342 float32_t __s0_556 = __p0_556; \ 54343 float32x2_t __s1_556 = __p1_556; \ 54344 float32x2_t __rev1_556; __rev1_556 = __builtin_shufflevector(__s1_556, __s1_556, 1, 0); \ 54345 __ret_556 = __s0_556 * __noswap_vget_lane_f32(__rev1_556, __p2_556); \ 54346 __ret_556; \ 54347 }) 54348 #endif 54349 54350 /* vmul_lane_f64(a, v, lane): forwards to __builtin_neon_vmul_lane_v with both vectors cast to int8x8_t and a trailing constant 10. NOTE(review): 10 is presumably the builtin's type selector for float64x1_t - confirm against the generator. */ #define vmul_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 54351 float64x1_t __ret; \ 54352 float64x1_t __s0 = __p0; \ 54353 float64x1_t __s1 = __p1; \ 54354 __ret = (float64x1_t) __builtin_neon_vmul_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 10); \ 54355 __ret; \ 54356 }) 54357 /* vmulq_lane_f64(a, v, lane): yields a * splatq_lane_f64(v, lane). The big-endian variant lane-reverses a only (v is a float64x1_t), uses __noswap_splatq_lane_f64, and lane-reverses the product. */ #ifdef __LITTLE_ENDIAN__ 54358 #define vmulq_lane_f64(__p0_557, __p1_557, __p2_557) __extension__ ({ \ 54359 float64x2_t __ret_557; \ 54360 float64x2_t __s0_557 = __p0_557; \ 54361 float64x1_t __s1_557 = __p1_557; \ 54362 __ret_557 = __s0_557 * splatq_lane_f64(__s1_557, __p2_557); \ 54363 __ret_557; \ 54364 }) 54365 #else 54366 #define vmulq_lane_f64(__p0_558, __p1_558, __p2_558) __extension__ ({ \ 54367 float64x2_t __ret_558; \ 54368 float64x2_t __s0_558 = __p0_558; \ 54369 float64x1_t __s1_558 = __p1_558; \ 54370 float64x2_t __rev0_558; __rev0_558 = __builtin_shufflevector(__s0_558, __s0_558, 1, 0); \ 54371 __ret_558 = __rev0_558 * __noswap_splatq_lane_f64(__s1_558, __p2_558); \ 54372 __ret_558 = __builtin_shufflevector(__ret_558, __ret_558, 1, 0); \ 54373 __ret_558; \ 54374 }) 54375 #endif 54376 54377 /* vmuld_laneq_f64(s, v, lane): yields s * vgetq_lane_f64(v, lane); the big-endian variant lane-reverses v and uses __noswap_vgetq_lane_f64. */ #ifdef __LITTLE_ENDIAN__ 54378 #define vmuld_laneq_f64(__p0_559, __p1_559, __p2_559) __extension__ ({ \ 54379 float64_t __ret_559; \ 54380 float64_t __s0_559 = __p0_559; 
\ 54381 float64x2_t __s1_559 = __p1_559; \ 54382 __ret_559 = __s0_559 * vgetq_lane_f64(__s1_559, __p2_559); \ 54383 __ret_559; \ 54384 }) 54385 #else 54386 #define vmuld_laneq_f64(__p0_560, __p1_560, __p2_560) __extension__ ({ \ 54387 float64_t __ret_560; \ 54388 float64_t __s0_560 = __p0_560; \ 54389 float64x2_t __s1_560 = __p1_560; \ 54390 float64x2_t __rev1_560; __rev1_560 = __builtin_shufflevector(__s1_560, __s1_560, 1, 0); \ 54391 __ret_560 = __s0_560 * __noswap_vgetq_lane_f64(__rev1_560, __p2_560); \ 54392 __ret_560; \ 54393 }) 54394 #endif 54395 54396 /* vmuls_laneq_f32(s, v, lane): yields s * vgetq_lane_f32(v, lane). The #else (big-endian) variant first lane-reverses v with __builtin_shufflevector and reads the lane through __noswap_vgetq_lane_f32. */ #ifdef __LITTLE_ENDIAN__ 54397 #define vmuls_laneq_f32(__p0_561, __p1_561, __p2_561) __extension__ ({ \ 54398 float32_t __ret_561; \ 54399 float32_t __s0_561 = __p0_561; \ 54400 float32x4_t __s1_561 = __p1_561; \ 54401 __ret_561 = __s0_561 * vgetq_lane_f32(__s1_561, __p2_561); \ 54402 __ret_561; \ 54403 }) 54404 #else 54405 #define vmuls_laneq_f32(__p0_562, __p1_562, __p2_562) __extension__ ({ \ 54406 float32_t __ret_562; \ 54407 float32_t __s0_562 = __p0_562; \ 54408 float32x4_t __s1_562 = __p1_562; \ 54409 float32x4_t __rev1_562; __rev1_562 = __builtin_shufflevector(__s1_562, __s1_562, 3, 2, 1, 0); \ 54410 __ret_562 = __s0_562 * __noswap_vgetq_lane_f32(__rev1_562, __p2_562); \ 54411 __ret_562; \ 54412 }) 54413 #endif 54414 54415 /* vmul_laneq_f64(a, v, lane): forwards to __builtin_neon_vmul_laneq_v with a cast to int8x8_t, v cast to int8x16_t, and a trailing constant 10; the big-endian variant passes a lane-reversed copy of v. NOTE(review): 10 is presumably the builtin's type selector for float64x1_t - confirm against the generator. */ #ifdef __LITTLE_ENDIAN__ 54416 #define vmul_laneq_f64(__p0, __p1, __p2) __extension__ ({ \ 54417 float64x1_t __ret; \ 54418 float64x1_t __s0 = __p0; \ 54419 float64x2_t __s1 = __p1; \ 54420 __ret = (float64x1_t) __builtin_neon_vmul_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 10); \ 54421 __ret; \ 54422 }) 54423 #else 54424 #define vmul_laneq_f64(__p0, __p1, __p2) __extension__ ({ \ 54425 float64x1_t __ret; \ 54426 float64x1_t __s0 = __p0; \ 54427 float64x2_t __s1 = __p1; \ 54428 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 54429 __ret = (float64x1_t) __builtin_neon_vmul_laneq_v((int8x8_t)__s0, (int8x16_t)__rev1, __p2, 10); \ 54430 __ret; \ 54431 }) 
54432 #endif 54433 54434 /* vmulq_laneq_u32(a, v, lane): yields a * splatq_laneq_u32(v, lane). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ splat is used, and the product is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54435 #define vmulq_laneq_u32(__p0_563, __p1_563, __p2_563) __extension__ ({ \ 54436 uint32x4_t __ret_563; \ 54437 uint32x4_t __s0_563 = __p0_563; \ 54438 uint32x4_t __s1_563 = __p1_563; \ 54439 __ret_563 = __s0_563 * splatq_laneq_u32(__s1_563, __p2_563); \ 54440 __ret_563; \ 54441 }) 54442 #else 54443 #define vmulq_laneq_u32(__p0_564, __p1_564, __p2_564) __extension__ ({ \ 54444 uint32x4_t __ret_564; \ 54445 uint32x4_t __s0_564 = __p0_564; \ 54446 uint32x4_t __s1_564 = __p1_564; \ 54447 uint32x4_t __rev0_564; __rev0_564 = __builtin_shufflevector(__s0_564, __s0_564, 3, 2, 1, 0); \ 54448 uint32x4_t __rev1_564; __rev1_564 = __builtin_shufflevector(__s1_564, __s1_564, 3, 2, 1, 0); \ 54449 __ret_564 = __rev0_564 * __noswap_splatq_laneq_u32(__rev1_564, __p2_564); \ 54450 __ret_564 = __builtin_shufflevector(__ret_564, __ret_564, 3, 2, 1, 0); \ 54451 __ret_564; \ 54452 }) 54453 #endif 54454 54455 /* vmulq_laneq_u16(a, v, lane): yields a * splatq_laneq_u16(v, lane); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54456 #define vmulq_laneq_u16(__p0_565, __p1_565, __p2_565) __extension__ ({ \ 54457 uint16x8_t __ret_565; \ 54458 uint16x8_t __s0_565 = __p0_565; \ 54459 uint16x8_t __s1_565 = __p1_565; \ 54460 __ret_565 = __s0_565 * splatq_laneq_u16(__s1_565, __p2_565); \ 54461 __ret_565; \ 54462 }) 54463 #else 54464 #define vmulq_laneq_u16(__p0_566, __p1_566, __p2_566) __extension__ ({ \ 54465 uint16x8_t __ret_566; \ 54466 uint16x8_t __s0_566 = __p0_566; \ 54467 uint16x8_t __s1_566 = __p1_566; \ 54468 uint16x8_t __rev0_566; __rev0_566 = __builtin_shufflevector(__s0_566, __s0_566, 7, 6, 5, 4, 3, 2, 1, 0); \ 54469 uint16x8_t __rev1_566; __rev1_566 = __builtin_shufflevector(__s1_566, __s1_566, 7, 6, 5, 4, 3, 2, 1, 0); \ 54470 __ret_566 = __rev0_566 * __noswap_splatq_laneq_u16(__rev1_566, __p2_566); \ 54471 __ret_566 = __builtin_shufflevector(__ret_566, __ret_566, 7, 6, 5, 4, 3, 2, 1, 0); \ 54472 __ret_566; \ 54473 }) 54474 #endif 54475 54476 /* vmulq_laneq_f64(a, v, lane): yields a * splatq_laneq_f64(v, lane); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54477 #define vmulq_laneq_f64(__p0_567, __p1_567, 
__p2_567) __extension__ ({ \ 54478 float64x2_t __ret_567; \ 54479 float64x2_t __s0_567 = __p0_567; \ 54480 float64x2_t __s1_567 = __p1_567; \ 54481 __ret_567 = __s0_567 * splatq_laneq_f64(__s1_567, __p2_567); \ 54482 __ret_567; \ 54483 }) 54484 #else 54485 #define vmulq_laneq_f64(__p0_568, __p1_568, __p2_568) __extension__ ({ \ 54486 float64x2_t __ret_568; \ 54487 float64x2_t __s0_568 = __p0_568; \ 54488 float64x2_t __s1_568 = __p1_568; \ 54489 float64x2_t __rev0_568; __rev0_568 = __builtin_shufflevector(__s0_568, __s0_568, 1, 0); \ 54490 float64x2_t __rev1_568; __rev1_568 = __builtin_shufflevector(__s1_568, __s1_568, 1, 0); \ 54491 __ret_568 = __rev0_568 * __noswap_splatq_laneq_f64(__rev1_568, __p2_568); \ 54492 __ret_568 = __builtin_shufflevector(__ret_568, __ret_568, 1, 0); \ 54493 __ret_568; \ 54494 }) 54495 #endif 54496 54497 /* vmulq_laneq_f32(a, v, lane): yields a * splatq_laneq_f32(v, lane). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ splat is used, and the product is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54498 #define vmulq_laneq_f32(__p0_569, __p1_569, __p2_569) __extension__ ({ \ 54499 float32x4_t __ret_569; \ 54500 float32x4_t __s0_569 = __p0_569; \ 54501 float32x4_t __s1_569 = __p1_569; \ 54502 __ret_569 = __s0_569 * splatq_laneq_f32(__s1_569, __p2_569); \ 54503 __ret_569; \ 54504 }) 54505 #else 54506 #define vmulq_laneq_f32(__p0_570, __p1_570, __p2_570) __extension__ ({ \ 54507 float32x4_t __ret_570; \ 54508 float32x4_t __s0_570 = __p0_570; \ 54509 float32x4_t __s1_570 = __p1_570; \ 54510 float32x4_t __rev0_570; __rev0_570 = __builtin_shufflevector(__s0_570, __s0_570, 3, 2, 1, 0); \ 54511 float32x4_t __rev1_570; __rev1_570 = __builtin_shufflevector(__s1_570, __s1_570, 3, 2, 1, 0); \ 54512 __ret_570 = __rev0_570 * __noswap_splatq_laneq_f32(__rev1_570, __p2_570); \ 54513 __ret_570 = __builtin_shufflevector(__ret_570, __ret_570, 3, 2, 1, 0); \ 54514 __ret_570; \ 54515 }) 54516 #endif 54517 54518 /* vmulq_laneq_s32(a, v, lane): yields a * splatq_laneq_s32(v, lane); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54519 #define vmulq_laneq_s32(__p0_571, __p1_571, __p2_571) __extension__ ({ \ 54520 int32x4_t __ret_571; \ 54521 int32x4_t __s0_571 = __p0_571; \ 54522 int32x4_t __s1_571 = __p1_571; \ 54523 
__ret_571 = __s0_571 * splatq_laneq_s32(__s1_571, __p2_571); \ 54524 __ret_571; \ 54525 }) 54526 #else 54527 #define vmulq_laneq_s32(__p0_572, __p1_572, __p2_572) __extension__ ({ \ 54528 int32x4_t __ret_572; \ 54529 int32x4_t __s0_572 = __p0_572; \ 54530 int32x4_t __s1_572 = __p1_572; \ 54531 int32x4_t __rev0_572; __rev0_572 = __builtin_shufflevector(__s0_572, __s0_572, 3, 2, 1, 0); \ 54532 int32x4_t __rev1_572; __rev1_572 = __builtin_shufflevector(__s1_572, __s1_572, 3, 2, 1, 0); \ 54533 __ret_572 = __rev0_572 * __noswap_splatq_laneq_s32(__rev1_572, __p2_572); \ 54534 __ret_572 = __builtin_shufflevector(__ret_572, __ret_572, 3, 2, 1, 0); \ 54535 __ret_572; \ 54536 }) 54537 #endif 54538 54539 /* vmulq_laneq_s16(a, v, lane): yields a * splatq_laneq_s16(v, lane). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ splat is used, and the product is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54540 #define vmulq_laneq_s16(__p0_573, __p1_573, __p2_573) __extension__ ({ \ 54541 int16x8_t __ret_573; \ 54542 int16x8_t __s0_573 = __p0_573; \ 54543 int16x8_t __s1_573 = __p1_573; \ 54544 __ret_573 = __s0_573 * splatq_laneq_s16(__s1_573, __p2_573); \ 54545 __ret_573; \ 54546 }) 54547 #else 54548 #define vmulq_laneq_s16(__p0_574, __p1_574, __p2_574) __extension__ ({ \ 54549 int16x8_t __ret_574; \ 54550 int16x8_t __s0_574 = __p0_574; \ 54551 int16x8_t __s1_574 = __p1_574; \ 54552 int16x8_t __rev0_574; __rev0_574 = __builtin_shufflevector(__s0_574, __s0_574, 7, 6, 5, 4, 3, 2, 1, 0); \ 54553 int16x8_t __rev1_574; __rev1_574 = __builtin_shufflevector(__s1_574, __s1_574, 7, 6, 5, 4, 3, 2, 1, 0); \ 54554 __ret_574 = __rev0_574 * __noswap_splatq_laneq_s16(__rev1_574, __p2_574); \ 54555 __ret_574 = __builtin_shufflevector(__ret_574, __ret_574, 7, 6, 5, 4, 3, 2, 1, 0); \ 54556 __ret_574; \ 54557 }) 54558 #endif 54559 54560 /* vmul_laneq_u32(a, v, lane): yields a * splat_laneq_u32(v, lane) with a 2-lane a and a 4-lane v; same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54561 #define vmul_laneq_u32(__p0_575, __p1_575, __p2_575) __extension__ ({ \ 54562 uint32x2_t __ret_575; \ 54563 uint32x2_t __s0_575 = __p0_575; \ 54564 uint32x4_t __s1_575 = __p1_575; \ 54565 __ret_575 = __s0_575 * splat_laneq_u32(__s1_575, __p2_575); \ 54566 __ret_575; \ 54567 }) 54568 #else 54569 #define 
vmul_laneq_u32(__p0_576, __p1_576, __p2_576) __extension__ ({ \ 54570 uint32x2_t __ret_576; \ 54571 uint32x2_t __s0_576 = __p0_576; \ 54572 uint32x4_t __s1_576 = __p1_576; \ 54573 uint32x2_t __rev0_576; __rev0_576 = __builtin_shufflevector(__s0_576, __s0_576, 1, 0); \ 54574 uint32x4_t __rev1_576; __rev1_576 = __builtin_shufflevector(__s1_576, __s1_576, 3, 2, 1, 0); \ 54575 __ret_576 = __rev0_576 * __noswap_splat_laneq_u32(__rev1_576, __p2_576); \ 54576 __ret_576 = __builtin_shufflevector(__ret_576, __ret_576, 1, 0); \ 54577 __ret_576; \ 54578 }) 54579 #endif 54580 54581 /* vmul_laneq_u16(a, v, lane): yields a * splat_laneq_u16(v, lane). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ splat is used, and the product is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54582 #define vmul_laneq_u16(__p0_577, __p1_577, __p2_577) __extension__ ({ \ 54583 uint16x4_t __ret_577; \ 54584 uint16x4_t __s0_577 = __p0_577; \ 54585 uint16x8_t __s1_577 = __p1_577; \ 54586 __ret_577 = __s0_577 * splat_laneq_u16(__s1_577, __p2_577); \ 54587 __ret_577; \ 54588 }) 54589 #else 54590 #define vmul_laneq_u16(__p0_578, __p1_578, __p2_578) __extension__ ({ \ 54591 uint16x4_t __ret_578; \ 54592 uint16x4_t __s0_578 = __p0_578; \ 54593 uint16x8_t __s1_578 = __p1_578; \ 54594 uint16x4_t __rev0_578; __rev0_578 = __builtin_shufflevector(__s0_578, __s0_578, 3, 2, 1, 0); \ 54595 uint16x8_t __rev1_578; __rev1_578 = __builtin_shufflevector(__s1_578, __s1_578, 7, 6, 5, 4, 3, 2, 1, 0); \ 54596 __ret_578 = __rev0_578 * __noswap_splat_laneq_u16(__rev1_578, __p2_578); \ 54597 __ret_578 = __builtin_shufflevector(__ret_578, __ret_578, 3, 2, 1, 0); \ 54598 __ret_578; \ 54599 }) 54600 #endif 54601 54602 /* vmul_laneq_f32(a, v, lane): yields a * splat_laneq_f32(v, lane); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54603 #define vmul_laneq_f32(__p0_579, __p1_579, __p2_579) __extension__ ({ \ 54604 float32x2_t __ret_579; \ 54605 float32x2_t __s0_579 = __p0_579; \ 54606 float32x4_t __s1_579 = __p1_579; \ 54607 __ret_579 = __s0_579 * splat_laneq_f32(__s1_579, __p2_579); \ 54608 __ret_579; \ 54609 }) 54610 #else 54611 #define vmul_laneq_f32(__p0_580, __p1_580, __p2_580) __extension__ ({ \ 54612 float32x2_t __ret_580; \ 54613 float32x2_t __s0_580 = __p0_580; \ 54614 
float32x4_t __s1_580 = __p1_580; \ 54615 float32x2_t __rev0_580; __rev0_580 = __builtin_shufflevector(__s0_580, __s0_580, 1, 0); \ 54616 float32x4_t __rev1_580; __rev1_580 = __builtin_shufflevector(__s1_580, __s1_580, 3, 2, 1, 0); \ 54617 __ret_580 = __rev0_580 * __noswap_splat_laneq_f32(__rev1_580, __p2_580); \ 54618 __ret_580 = __builtin_shufflevector(__ret_580, __ret_580, 1, 0); \ 54619 __ret_580; \ 54620 }) 54621 #endif 54622 54623 /* vmul_laneq_s32(a, v, lane): yields a * splat_laneq_s32(v, lane). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ splat is used, and the product is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54624 #define vmul_laneq_s32(__p0_581, __p1_581, __p2_581) __extension__ ({ \ 54625 int32x2_t __ret_581; \ 54626 int32x2_t __s0_581 = __p0_581; \ 54627 int32x4_t __s1_581 = __p1_581; \ 54628 __ret_581 = __s0_581 * splat_laneq_s32(__s1_581, __p2_581); \ 54629 __ret_581; \ 54630 }) 54631 #else 54632 #define vmul_laneq_s32(__p0_582, __p1_582, __p2_582) __extension__ ({ \ 54633 int32x2_t __ret_582; \ 54634 int32x2_t __s0_582 = __p0_582; \ 54635 int32x4_t __s1_582 = __p1_582; \ 54636 int32x2_t __rev0_582; __rev0_582 = __builtin_shufflevector(__s0_582, __s0_582, 1, 0); \ 54637 int32x4_t __rev1_582; __rev1_582 = __builtin_shufflevector(__s1_582, __s1_582, 3, 2, 1, 0); \ 54638 __ret_582 = __rev0_582 * __noswap_splat_laneq_s32(__rev1_582, __p2_582); \ 54639 __ret_582 = __builtin_shufflevector(__ret_582, __ret_582, 1, 0); \ 54640 __ret_582; \ 54641 }) 54642 #endif 54643 54644 /* vmul_laneq_s16(a, v, lane): yields a * splat_laneq_s16(v, lane); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54645 #define vmul_laneq_s16(__p0_583, __p1_583, __p2_583) __extension__ ({ \ 54646 int16x4_t __ret_583; \ 54647 int16x4_t __s0_583 = __p0_583; \ 54648 int16x8_t __s1_583 = __p1_583; \ 54649 __ret_583 = __s0_583 * splat_laneq_s16(__s1_583, __p2_583); \ 54650 __ret_583; \ 54651 }) 54652 #else 54653 #define vmul_laneq_s16(__p0_584, __p1_584, __p2_584) __extension__ ({ \ 54654 int16x4_t __ret_584; \ 54655 int16x4_t __s0_584 = __p0_584; \ 54656 int16x8_t __s1_584 = __p1_584; \ 54657 int16x4_t __rev0_584; __rev0_584 = __builtin_shufflevector(__s0_584, __s0_584, 3, 2, 1, 0); \ 54658 int16x8_t __rev1_584; __rev1_584 = 
__builtin_shufflevector(__s1_584, __s1_584, 7, 6, 5, 4, 3, 2, 1, 0); \ 54659 __ret_584 = __rev0_584 * __noswap_splat_laneq_s16(__rev1_584, __p2_584); \ 54660 __ret_584 = __builtin_shufflevector(__ret_584, __ret_584, 3, 2, 1, 0); \ 54661 __ret_584; \ 54662 }) 54663 #endif 54664 54665 /* vmul_n_f64: forwards __p0 and the scalar __p1 to __builtin_neon_vmul_n_f64; this one definition is not guarded by __LITTLE_ENDIAN__. */ __ai __attribute__((target("neon"))) float64x1_t vmul_n_f64(float64x1_t __p0, float64_t __p1) { 54666 float64x1_t __ret; 54667 __ret = (float64x1_t) __builtin_neon_vmul_n_f64((float64x1_t)__p0, __p1); 54668 return __ret; 54669 } 54670 /* vmulq_n_f64: returns __p0 * (float64x2_t){__p1, __p1}. The #else (big-endian) variant lane-reverses __p0 with __builtin_shufflevector before the multiply and lane-reverses the product. */ #ifdef __LITTLE_ENDIAN__ 54671 __ai __attribute__((target("neon"))) float64x2_t vmulq_n_f64(float64x2_t __p0, float64_t __p1) { 54672 float64x2_t __ret; 54673 __ret = __p0 * (float64x2_t) {__p1, __p1}; 54674 return __ret; 54675 } 54676 #else 54677 __ai __attribute__((target("neon"))) float64x2_t vmulq_n_f64(float64x2_t __p0, float64_t __p1) { 54678 float64x2_t __ret; 54679 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 54680 __ret = __rev0 * (float64x2_t) {__p1, __p1}; 54681 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 54682 return __ret; 54683 } 54684 #endif 54685 54686 /* vmull_high_p8: returns vmull_p8(vget_high_p8(__p0), vget_high_p8(__p1)). The big-endian variant lane-reverses both arguments, calls the __noswap_ helpers, and lane-reverses the result. */ #ifdef __LITTLE_ENDIAN__ 54687 __ai __attribute__((target("neon"))) poly16x8_t vmull_high_p8(poly8x16_t __p0, poly8x16_t __p1) { 54688 poly16x8_t __ret; 54689 __ret = vmull_p8(vget_high_p8(__p0), vget_high_p8(__p1)); 54690 return __ret; 54691 } 54692 #else 54693 __ai __attribute__((target("neon"))) poly16x8_t vmull_high_p8(poly8x16_t __p0, poly8x16_t __p1) { 54694 poly16x8_t __ret; 54695 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54696 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54697 __ret = __noswap_vmull_p8(__noswap_vget_high_p8(__rev0), __noswap_vget_high_p8(__rev1)); 54698 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 54699 return __ret; 54700 } 54701 #endif 54702 54703 #ifdef 
__LITTLE_ENDIAN__ 54704 /* vmull_high_u8: returns vmull_u8(vget_high_u8(__p0), vget_high_u8(__p1)). In the #else (big-endian) variant both arguments are lane-reversed with __builtin_shufflevector, the __noswap_ helpers are called, and the result is lane-reversed back. */ __ai __attribute__((target("neon"))) uint16x8_t vmull_high_u8(uint8x16_t __p0, uint8x16_t __p1) { 54705 uint16x8_t __ret; 54706 __ret = vmull_u8(vget_high_u8(__p0), vget_high_u8(__p1)); 54707 return __ret; 54708 } 54709 #else 54710 __ai __attribute__((target("neon"))) uint16x8_t vmull_high_u8(uint8x16_t __p0, uint8x16_t __p1) { 54711 uint16x8_t __ret; 54712 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54713 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54714 __ret = __noswap_vmull_u8(__noswap_vget_high_u8(__rev0), __noswap_vget_high_u8(__rev1)); 54715 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 54716 return __ret; 54717 } 54718 #endif 54719 54720 /* vmull_high_u32: returns vmull_u32(vget_high_u32(__p0), vget_high_u32(__p1)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54721 __ai __attribute__((target("neon"))) uint64x2_t vmull_high_u32(uint32x4_t __p0, uint32x4_t __p1) { 54722 uint64x2_t __ret; 54723 __ret = vmull_u32(vget_high_u32(__p0), vget_high_u32(__p1)); 54724 return __ret; 54725 } 54726 #else 54727 __ai __attribute__((target("neon"))) uint64x2_t vmull_high_u32(uint32x4_t __p0, uint32x4_t __p1) { 54728 uint64x2_t __ret; 54729 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 54730 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 54731 __ret = __noswap_vmull_u32(__noswap_vget_high_u32(__rev0), __noswap_vget_high_u32(__rev1)); 54732 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 54733 return __ret; 54734 } 54735 #endif 54736 54737 /* vmull_high_u16: returns vmull_u16(vget_high_u16(__p0), vget_high_u16(__p1)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54738 __ai __attribute__((target("neon"))) uint32x4_t vmull_high_u16(uint16x8_t __p0, uint16x8_t __p1) { 54739 uint32x4_t __ret; 54740 __ret = vmull_u16(vget_high_u16(__p0), vget_high_u16(__p1)); 54741 return __ret; 54742 } 54743 #else 54744 __ai __attribute__((target("neon"))) uint32x4_t vmull_high_u16(uint16x8_t __p0, uint16x8_t __p1) { 54745 
uint32x4_t __ret; 54746 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 54747 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 54748 __ret = __noswap_vmull_u16(__noswap_vget_high_u16(__rev0), __noswap_vget_high_u16(__rev1)); 54749 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 54750 return __ret; 54751 } 54752 #endif 54753 54754 /* vmull_high_s8: returns vmull_s8(vget_high_s8(__p0), vget_high_s8(__p1)). In the #else (big-endian) variant both arguments are lane-reversed with __builtin_shufflevector, the __noswap_ helpers are called, and the result is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54755 __ai __attribute__((target("neon"))) int16x8_t vmull_high_s8(int8x16_t __p0, int8x16_t __p1) { 54756 int16x8_t __ret; 54757 __ret = vmull_s8(vget_high_s8(__p0), vget_high_s8(__p1)); 54758 return __ret; 54759 } 54760 #else 54761 __ai __attribute__((target("neon"))) int16x8_t vmull_high_s8(int8x16_t __p0, int8x16_t __p1) { 54762 int16x8_t __ret; 54763 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54764 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 54765 __ret = __noswap_vmull_s8(__noswap_vget_high_s8(__rev0), __noswap_vget_high_s8(__rev1)); 54766 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 54767 return __ret; 54768 } 54769 #endif 54770 54771 /* vmull_high_s32: returns vmull_s32(vget_high_s32(__p0), vget_high_s32(__p1)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54772 __ai __attribute__((target("neon"))) int64x2_t vmull_high_s32(int32x4_t __p0, int32x4_t __p1) { 54773 int64x2_t __ret; 54774 __ret = vmull_s32(vget_high_s32(__p0), vget_high_s32(__p1)); 54775 return __ret; 54776 } 54777 #else 54778 __ai __attribute__((target("neon"))) int64x2_t vmull_high_s32(int32x4_t __p0, int32x4_t __p1) { 54779 int64x2_t __ret; 54780 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 54781 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 54782 __ret = __noswap_vmull_s32(__noswap_vget_high_s32(__rev0), __noswap_vget_high_s32(__rev1)); 54783 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 54784 return __ret; 
54785 } 54786 #endif 54787 54788 /* vmull_high_s16: returns vmull_s16(vget_high_s16(__p0), vget_high_s16(__p1)). In the #else (big-endian) variant both arguments are lane-reversed with __builtin_shufflevector, the __noswap_ helpers are called, and the result is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54789 __ai __attribute__((target("neon"))) int32x4_t vmull_high_s16(int16x8_t __p0, int16x8_t __p1) { 54790 int32x4_t __ret; 54791 __ret = vmull_s16(vget_high_s16(__p0), vget_high_s16(__p1)); 54792 return __ret; 54793 } 54794 #else 54795 __ai __attribute__((target("neon"))) int32x4_t vmull_high_s16(int16x8_t __p0, int16x8_t __p1) { 54796 int32x4_t __ret; 54797 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 54798 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 54799 __ret = __noswap_vmull_s16(__noswap_vget_high_s16(__rev0), __noswap_vget_high_s16(__rev1)); 54800 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 54801 return __ret; 54802 } 54803 #endif 54804 54805 /* vmull_high_lane_u32(a, v, lane): yields vmull_u32(vget_high_u32(a), splat_lane_u32(v, lane)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54806 #define vmull_high_lane_u32(__p0_585, __p1_585, __p2_585) __extension__ ({ \ 54807 uint64x2_t __ret_585; \ 54808 uint32x4_t __s0_585 = __p0_585; \ 54809 uint32x2_t __s1_585 = __p1_585; \ 54810 __ret_585 = vmull_u32(vget_high_u32(__s0_585), splat_lane_u32(__s1_585, __p2_585)); \ 54811 __ret_585; \ 54812 }) 54813 #else 54814 #define vmull_high_lane_u32(__p0_586, __p1_586, __p2_586) __extension__ ({ \ 54815 uint64x2_t __ret_586; \ 54816 uint32x4_t __s0_586 = __p0_586; \ 54817 uint32x2_t __s1_586 = __p1_586; \ 54818 uint32x4_t __rev0_586; __rev0_586 = __builtin_shufflevector(__s0_586, __s0_586, 3, 2, 1, 0); \ 54819 uint32x2_t __rev1_586; __rev1_586 = __builtin_shufflevector(__s1_586, __s1_586, 1, 0); \ 54820 __ret_586 = __noswap_vmull_u32(__noswap_vget_high_u32(__rev0_586), __noswap_splat_lane_u32(__rev1_586, __p2_586)); \ 54821 __ret_586 = __builtin_shufflevector(__ret_586, __ret_586, 1, 0); \ 54822 __ret_586; \ 54823 }) 54824 #endif 54825 54826 /* vmull_high_lane_u16(a, v, lane): yields vmull_u16(vget_high_u16(a), splat_lane_u16(v, lane)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54827 #define vmull_high_lane_u16(__p0_587, __p1_587, __p2_587) __extension__ ({ \ 54828 uint32x4_t __ret_587; \ 54829 uint16x8_t __s0_587 = __p0_587; \ 54830 
uint16x4_t __s1_587 = __p1_587; \ 54831 __ret_587 = vmull_u16(vget_high_u16(__s0_587), splat_lane_u16(__s1_587, __p2_587)); \ 54832 __ret_587; \ 54833 }) 54834 #else 54835 #define vmull_high_lane_u16(__p0_588, __p1_588, __p2_588) __extension__ ({ \ 54836 uint32x4_t __ret_588; \ 54837 uint16x8_t __s0_588 = __p0_588; \ 54838 uint16x4_t __s1_588 = __p1_588; \ 54839 uint16x8_t __rev0_588; __rev0_588 = __builtin_shufflevector(__s0_588, __s0_588, 7, 6, 5, 4, 3, 2, 1, 0); \ 54840 uint16x4_t __rev1_588; __rev1_588 = __builtin_shufflevector(__s1_588, __s1_588, 3, 2, 1, 0); \ 54841 __ret_588 = __noswap_vmull_u16(__noswap_vget_high_u16(__rev0_588), __noswap_splat_lane_u16(__rev1_588, __p2_588)); \ 54842 __ret_588 = __builtin_shufflevector(__ret_588, __ret_588, 3, 2, 1, 0); \ 54843 __ret_588; \ 54844 }) 54845 #endif 54846 54847 /* vmull_high_lane_s32(a, v, lane): yields vmull_s32(vget_high_s32(a), splat_lane_s32(v, lane)). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ helpers are used, and the result is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54848 #define vmull_high_lane_s32(__p0_589, __p1_589, __p2_589) __extension__ ({ \ 54849 int64x2_t __ret_589; \ 54850 int32x4_t __s0_589 = __p0_589; \ 54851 int32x2_t __s1_589 = __p1_589; \ 54852 __ret_589 = vmull_s32(vget_high_s32(__s0_589), splat_lane_s32(__s1_589, __p2_589)); \ 54853 __ret_589; \ 54854 }) 54855 #else 54856 #define vmull_high_lane_s32(__p0_590, __p1_590, __p2_590) __extension__ ({ \ 54857 int64x2_t __ret_590; \ 54858 int32x4_t __s0_590 = __p0_590; \ 54859 int32x2_t __s1_590 = __p1_590; \ 54860 int32x4_t __rev0_590; __rev0_590 = __builtin_shufflevector(__s0_590, __s0_590, 3, 2, 1, 0); \ 54861 int32x2_t __rev1_590; __rev1_590 = __builtin_shufflevector(__s1_590, __s1_590, 1, 0); \ 54862 __ret_590 = __noswap_vmull_s32(__noswap_vget_high_s32(__rev0_590), __noswap_splat_lane_s32(__rev1_590, __p2_590)); \ 54863 __ret_590 = __builtin_shufflevector(__ret_590, __ret_590, 1, 0); \ 54864 __ret_590; \ 54865 }) 54866 #endif 54867 54868 /* vmull_high_lane_s16(a, v, lane): yields vmull_s16(vget_high_s16(a), splat_lane_s16(v, lane)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54869 #define vmull_high_lane_s16(__p0_591, __p1_591, __p2_591) __extension__ ({ \ 54870 int32x4_t __ret_591; \ 54871 int16x8_t __s0_591 = __p0_591; \ 54872 int16x4_t 
__s1_591 = __p1_591; \ 54873 __ret_591 = vmull_s16(vget_high_s16(__s0_591), splat_lane_s16(__s1_591, __p2_591)); \ 54874 __ret_591; \ 54875 }) 54876 #else 54877 #define vmull_high_lane_s16(__p0_592, __p1_592, __p2_592) __extension__ ({ \ 54878 int32x4_t __ret_592; \ 54879 int16x8_t __s0_592 = __p0_592; \ 54880 int16x4_t __s1_592 = __p1_592; \ 54881 int16x8_t __rev0_592; __rev0_592 = __builtin_shufflevector(__s0_592, __s0_592, 7, 6, 5, 4, 3, 2, 1, 0); \ 54882 int16x4_t __rev1_592; __rev1_592 = __builtin_shufflevector(__s1_592, __s1_592, 3, 2, 1, 0); \ 54883 __ret_592 = __noswap_vmull_s16(__noswap_vget_high_s16(__rev0_592), __noswap_splat_lane_s16(__rev1_592, __p2_592)); \ 54884 __ret_592 = __builtin_shufflevector(__ret_592, __ret_592, 3, 2, 1, 0); \ 54885 __ret_592; \ 54886 }) 54887 #endif 54888 54889 /* vmull_high_laneq_u32(a, v, lane): yields vmull_u32(vget_high_u32(a), splat_laneq_u32(v, lane)). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ helpers are used, and the result is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54890 #define vmull_high_laneq_u32(__p0_593, __p1_593, __p2_593) __extension__ ({ \ 54891 uint64x2_t __ret_593; \ 54892 uint32x4_t __s0_593 = __p0_593; \ 54893 uint32x4_t __s1_593 = __p1_593; \ 54894 __ret_593 = vmull_u32(vget_high_u32(__s0_593), splat_laneq_u32(__s1_593, __p2_593)); \ 54895 __ret_593; \ 54896 }) 54897 #else 54898 #define vmull_high_laneq_u32(__p0_594, __p1_594, __p2_594) __extension__ ({ \ 54899 uint64x2_t __ret_594; \ 54900 uint32x4_t __s0_594 = __p0_594; \ 54901 uint32x4_t __s1_594 = __p1_594; \ 54902 uint32x4_t __rev0_594; __rev0_594 = __builtin_shufflevector(__s0_594, __s0_594, 3, 2, 1, 0); \ 54903 uint32x4_t __rev1_594; __rev1_594 = __builtin_shufflevector(__s1_594, __s1_594, 3, 2, 1, 0); \ 54904 __ret_594 = __noswap_vmull_u32(__noswap_vget_high_u32(__rev0_594), __noswap_splat_laneq_u32(__rev1_594, __p2_594)); \ 54905 __ret_594 = __builtin_shufflevector(__ret_594, __ret_594, 1, 0); \ 54906 __ret_594; \ 54907 }) 54908 #endif 54909 54910 /* vmull_high_laneq_u16(a, v, lane): yields vmull_u16(vget_high_u16(a), splat_laneq_u16(v, lane)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54911 #define vmull_high_laneq_u16(__p0_595, __p1_595, __p2_595) __extension__ ({ \ 54912 uint32x4_t __ret_595; \ 54913 uint16x8_t __s0_595 = __p0_595; \ 54914 
uint16x8_t __s1_595 = __p1_595; \ 54915 __ret_595 = vmull_u16(vget_high_u16(__s0_595), splat_laneq_u16(__s1_595, __p2_595)); \ 54916 __ret_595; \ 54917 }) 54918 #else 54919 #define vmull_high_laneq_u16(__p0_596, __p1_596, __p2_596) __extension__ ({ \ 54920 uint32x4_t __ret_596; \ 54921 uint16x8_t __s0_596 = __p0_596; \ 54922 uint16x8_t __s1_596 = __p1_596; \ 54923 uint16x8_t __rev0_596; __rev0_596 = __builtin_shufflevector(__s0_596, __s0_596, 7, 6, 5, 4, 3, 2, 1, 0); \ 54924 uint16x8_t __rev1_596; __rev1_596 = __builtin_shufflevector(__s1_596, __s1_596, 7, 6, 5, 4, 3, 2, 1, 0); \ 54925 __ret_596 = __noswap_vmull_u16(__noswap_vget_high_u16(__rev0_596), __noswap_splat_laneq_u16(__rev1_596, __p2_596)); \ 54926 __ret_596 = __builtin_shufflevector(__ret_596, __ret_596, 3, 2, 1, 0); \ 54927 __ret_596; \ 54928 }) 54929 #endif 54930 54931 /* vmull_high_laneq_s32(a, v, lane): yields vmull_s32(vget_high_s32(a), splat_laneq_s32(v, lane)). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ helpers are used, and the result is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 54932 #define vmull_high_laneq_s32(__p0_597, __p1_597, __p2_597) __extension__ ({ \ 54933 int64x2_t __ret_597; \ 54934 int32x4_t __s0_597 = __p0_597; \ 54935 int32x4_t __s1_597 = __p1_597; \ 54936 __ret_597 = vmull_s32(vget_high_s32(__s0_597), splat_laneq_s32(__s1_597, __p2_597)); \ 54937 __ret_597; \ 54938 }) 54939 #else 54940 #define vmull_high_laneq_s32(__p0_598, __p1_598, __p2_598) __extension__ ({ \ 54941 int64x2_t __ret_598; \ 54942 int32x4_t __s0_598 = __p0_598; \ 54943 int32x4_t __s1_598 = __p1_598; \ 54944 int32x4_t __rev0_598; __rev0_598 = __builtin_shufflevector(__s0_598, __s0_598, 3, 2, 1, 0); \ 54945 int32x4_t __rev1_598; __rev1_598 = __builtin_shufflevector(__s1_598, __s1_598, 3, 2, 1, 0); \ 54946 __ret_598 = __noswap_vmull_s32(__noswap_vget_high_s32(__rev0_598), __noswap_splat_laneq_s32(__rev1_598, __p2_598)); \ 54947 __ret_598 = __builtin_shufflevector(__ret_598, __ret_598, 1, 0); \ 54948 __ret_598; \ 54949 }) 54950 #endif 54951 54952 /* vmull_high_laneq_s16(a, v, lane): yields vmull_s16(vget_high_s16(a), splat_laneq_s16(v, lane)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 54953 #define vmull_high_laneq_s16(__p0_599, __p1_599, __p2_599) __extension__ ({ \ 54954 int32x4_t __ret_599; \ 54955 int16x8_t __s0_599 = 
__p0_599; \ 54956 int16x8_t __s1_599 = __p1_599; \ 54957 __ret_599 = vmull_s16(vget_high_s16(__s0_599), splat_laneq_s16(__s1_599, __p2_599)); \ 54958 __ret_599; \ 54959 }) 54960 #else 54961 #define vmull_high_laneq_s16(__p0_600, __p1_600, __p2_600) __extension__ ({ \ 54962 int32x4_t __ret_600; \ 54963 int16x8_t __s0_600 = __p0_600; \ 54964 int16x8_t __s1_600 = __p1_600; \ 54965 int16x8_t __rev0_600; __rev0_600 = __builtin_shufflevector(__s0_600, __s0_600, 7, 6, 5, 4, 3, 2, 1, 0); \ 54966 int16x8_t __rev1_600; __rev1_600 = __builtin_shufflevector(__s1_600, __s1_600, 7, 6, 5, 4, 3, 2, 1, 0); \ 54967 __ret_600 = __noswap_vmull_s16(__noswap_vget_high_s16(__rev0_600), __noswap_splat_laneq_s16(__rev1_600, __p2_600)); \ 54968 __ret_600 = __builtin_shufflevector(__ret_600, __ret_600, 3, 2, 1, 0); \ 54969 __ret_600; \ 54970 }) 54971 #endif 54972 54973 /* vmull_high_n_u32: returns vmull_n_u32(vget_high_u32(__p0), __p1). The #else (big-endian) variant lane-reverses __p0 with __builtin_shufflevector, calls the __noswap_ helpers with the scalar __p1 unchanged, and lane-reverses the result. */ #ifdef __LITTLE_ENDIAN__ 54974 __ai __attribute__((target("neon"))) uint64x2_t vmull_high_n_u32(uint32x4_t __p0, uint32_t __p1) { 54975 uint64x2_t __ret; 54976 __ret = vmull_n_u32(vget_high_u32(__p0), __p1); 54977 return __ret; 54978 } 54979 #else 54980 __ai __attribute__((target("neon"))) uint64x2_t vmull_high_n_u32(uint32x4_t __p0, uint32_t __p1) { 54981 uint64x2_t __ret; 54982 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 54983 __ret = __noswap_vmull_n_u32(__noswap_vget_high_u32(__rev0), __p1); 54984 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 54985 return __ret; 54986 } 54987 #endif 54988 54989 /* vmull_high_n_u16: returns vmull_n_u16(vget_high_u16(__p0), __p1); same big-endian pattern, reversing only the vector argument. */ #ifdef __LITTLE_ENDIAN__ 54990 __ai __attribute__((target("neon"))) uint32x4_t vmull_high_n_u16(uint16x8_t __p0, uint16_t __p1) { 54991 uint32x4_t __ret; 54992 __ret = vmull_n_u16(vget_high_u16(__p0), __p1); 54993 return __ret; 54994 } 54995 #else 54996 __ai __attribute__((target("neon"))) uint32x4_t vmull_high_n_u16(uint16x8_t __p0, uint16_t __p1) { 54997 uint32x4_t __ret; 54998 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 54999 __ret = 
__noswap_vmull_n_u16(__noswap_vget_high_u16(__rev0), __p1); 55000 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55001 return __ret; 55002 } 55003 #endif 55004 55005 /* vmull_high_n_s32: returns vmull_n_s32(vget_high_s32(__p0), __p1). The #else (big-endian) variant lane-reverses __p0 with __builtin_shufflevector, calls the __noswap_ helpers with the scalar __p1 unchanged, and lane-reverses the result. */ #ifdef __LITTLE_ENDIAN__ 55006 __ai __attribute__((target("neon"))) int64x2_t vmull_high_n_s32(int32x4_t __p0, int32_t __p1) { 55007 int64x2_t __ret; 55008 __ret = vmull_n_s32(vget_high_s32(__p0), __p1); 55009 return __ret; 55010 } 55011 #else 55012 __ai __attribute__((target("neon"))) int64x2_t vmull_high_n_s32(int32x4_t __p0, int32_t __p1) { 55013 int64x2_t __ret; 55014 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55015 __ret = __noswap_vmull_n_s32(__noswap_vget_high_s32(__rev0), __p1); 55016 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55017 return __ret; 55018 } 55019 #endif 55020 55021 /* vmull_high_n_s16: returns vmull_n_s16(vget_high_s16(__p0), __p1); same big-endian pattern, reversing only the vector argument. */ #ifdef __LITTLE_ENDIAN__ 55022 __ai __attribute__((target("neon"))) int32x4_t vmull_high_n_s16(int16x8_t __p0, int16_t __p1) { 55023 int32x4_t __ret; 55024 __ret = vmull_n_s16(vget_high_s16(__p0), __p1); 55025 return __ret; 55026 } 55027 #else 55028 __ai __attribute__((target("neon"))) int32x4_t vmull_high_n_s16(int16x8_t __p0, int16_t __p1) { 55029 int32x4_t __ret; 55030 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 55031 __ret = __noswap_vmull_n_s16(__noswap_vget_high_s16(__rev0), __p1); 55032 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55033 return __ret; 55034 } 55035 #endif 55036 55037 /* vmull_laneq_u32(a, v, lane): yields vmull_u32(a, splat_laneq_u32(v, lane)); the big-endian variant lane-reverses a and v, uses the __noswap_ helpers, and lane-reverses the result. */ #ifdef __LITTLE_ENDIAN__ 55038 #define vmull_laneq_u32(__p0_601, __p1_601, __p2_601) __extension__ ({ \ 55039 uint64x2_t __ret_601; \ 55040 uint32x2_t __s0_601 = __p0_601; \ 55041 uint32x4_t __s1_601 = __p1_601; \ 55042 __ret_601 = vmull_u32(__s0_601, splat_laneq_u32(__s1_601, __p2_601)); \ 55043 __ret_601; \ 55044 }) 55045 #else 55046 #define vmull_laneq_u32(__p0_602, __p1_602, __p2_602) __extension__ ({ \ 55047 uint64x2_t __ret_602; \ 55048 uint32x2_t __s0_602 = __p0_602; \ 55049 uint32x4_t __s1_602 = __p1_602; \ 55050 
uint32x2_t __rev0_602; __rev0_602 = __builtin_shufflevector(__s0_602, __s0_602, 1, 0); \ 55051 uint32x4_t __rev1_602; __rev1_602 = __builtin_shufflevector(__s1_602, __s1_602, 3, 2, 1, 0); \ 55052 __ret_602 = __noswap_vmull_u32(__rev0_602, __noswap_splat_laneq_u32(__rev1_602, __p2_602)); \ 55053 __ret_602 = __builtin_shufflevector(__ret_602, __ret_602, 1, 0); \ 55054 __ret_602; \ 55055 }) 55056 #endif 55057 55058 /* vmull_laneq_u16(a, v, lane): yields vmull_u16(a, splat_laneq_u16(v, lane)). In the #else (big-endian) variant a and v are lane-reversed with __builtin_shufflevector, the __noswap_ helpers are used, and the result is lane-reversed back. */ #ifdef __LITTLE_ENDIAN__ 55059 #define vmull_laneq_u16(__p0_603, __p1_603, __p2_603) __extension__ ({ \ 55060 uint32x4_t __ret_603; \ 55061 uint16x4_t __s0_603 = __p0_603; \ 55062 uint16x8_t __s1_603 = __p1_603; \ 55063 __ret_603 = vmull_u16(__s0_603, splat_laneq_u16(__s1_603, __p2_603)); \ 55064 __ret_603; \ 55065 }) 55066 #else 55067 #define vmull_laneq_u16(__p0_604, __p1_604, __p2_604) __extension__ ({ \ 55068 uint32x4_t __ret_604; \ 55069 uint16x4_t __s0_604 = __p0_604; \ 55070 uint16x8_t __s1_604 = __p1_604; \ 55071 uint16x4_t __rev0_604; __rev0_604 = __builtin_shufflevector(__s0_604, __s0_604, 3, 2, 1, 0); \ 55072 uint16x8_t __rev1_604; __rev1_604 = __builtin_shufflevector(__s1_604, __s1_604, 7, 6, 5, 4, 3, 2, 1, 0); \ 55073 __ret_604 = __noswap_vmull_u16(__rev0_604, __noswap_splat_laneq_u16(__rev1_604, __p2_604)); \ 55074 __ret_604 = __builtin_shufflevector(__ret_604, __ret_604, 3, 2, 1, 0); \ 55075 __ret_604; \ 55076 }) 55077 #endif 55078 55079 /* vmull_laneq_s32(a, v, lane): yields vmull_s32(a, splat_laneq_s32(v, lane)); same big-endian reverse / __noswap_ / reverse pattern. */ #ifdef __LITTLE_ENDIAN__ 55080 #define vmull_laneq_s32(__p0_605, __p1_605, __p2_605) __extension__ ({ \ 55081 int64x2_t __ret_605; \ 55082 int32x2_t __s0_605 = __p0_605; \ 55083 int32x4_t __s1_605 = __p1_605; \ 55084 __ret_605 = vmull_s32(__s0_605, splat_laneq_s32(__s1_605, __p2_605)); \ 55085 __ret_605; \ 55086 }) 55087 #else 55088 #define vmull_laneq_s32(__p0_606, __p1_606, __p2_606) __extension__ ({ \ 55089 int64x2_t __ret_606; \ 55090 int32x2_t __s0_606 = __p0_606; \ 55091 int32x4_t __s1_606 = __p1_606; \ 55092 int32x2_t __rev0_606; __rev0_606 = __builtin_shufflevector(__s0_606, __s0_606, 1, 0); \ 55093 
int32x4_t __rev1_606; __rev1_606 = __builtin_shufflevector(__s1_606, __s1_606, 3, 2, 1, 0); \ 55094 __ret_606 = __noswap_vmull_s32(__rev0_606, __noswap_splat_laneq_s32(__rev1_606, __p2_606)); \ 55095 __ret_606 = __builtin_shufflevector(__ret_606, __ret_606, 1, 0); \ 55096 __ret_606; \ 55097 }) 55098 #endif 55099 55100 #ifdef __LITTLE_ENDIAN__ 55101 #define vmull_laneq_s16(__p0_607, __p1_607, __p2_607) __extension__ ({ \ 55102 int32x4_t __ret_607; \ 55103 int16x4_t __s0_607 = __p0_607; \ 55104 int16x8_t __s1_607 = __p1_607; \ 55105 __ret_607 = vmull_s16(__s0_607, splat_laneq_s16(__s1_607, __p2_607)); \ 55106 __ret_607; \ 55107 }) 55108 #else 55109 #define vmull_laneq_s16(__p0_608, __p1_608, __p2_608) __extension__ ({ \ 55110 int32x4_t __ret_608; \ 55111 int16x4_t __s0_608 = __p0_608; \ 55112 int16x8_t __s1_608 = __p1_608; \ 55113 int16x4_t __rev0_608; __rev0_608 = __builtin_shufflevector(__s0_608, __s0_608, 3, 2, 1, 0); \ 55114 int16x8_t __rev1_608; __rev1_608 = __builtin_shufflevector(__s1_608, __s1_608, 7, 6, 5, 4, 3, 2, 1, 0); \ 55115 __ret_608 = __noswap_vmull_s16(__rev0_608, __noswap_splat_laneq_s16(__rev1_608, __p2_608)); \ 55116 __ret_608 = __builtin_shufflevector(__ret_608, __ret_608, 3, 2, 1, 0); \ 55117 __ret_608; \ 55118 }) 55119 #endif 55120 55121 #ifdef __LITTLE_ENDIAN__ 55122 __ai __attribute__((target("neon"))) float64x2_t vmulxq_f64(float64x2_t __p0, float64x2_t __p1) { 55123 float64x2_t __ret; 55124 __ret = (float64x2_t) __builtin_neon_vmulxq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 55125 return __ret; 55126 } 55127 #else 55128 __ai __attribute__((target("neon"))) float64x2_t vmulxq_f64(float64x2_t __p0, float64x2_t __p1) { 55129 float64x2_t __ret; 55130 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55131 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55132 __ret = (float64x2_t) __builtin_neon_vmulxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 55133 __ret = __builtin_shufflevector(__ret, __ret, 1, 
0); 55134 return __ret; 55135 } 55136 __ai __attribute__((target("neon"))) float64x2_t __noswap_vmulxq_f64(float64x2_t __p0, float64x2_t __p1) { 55137 float64x2_t __ret; 55138 __ret = (float64x2_t) __builtin_neon_vmulxq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 55139 return __ret; 55140 } 55141 #endif 55142 55143 #ifdef __LITTLE_ENDIAN__ 55144 __ai __attribute__((target("neon"))) float32x4_t vmulxq_f32(float32x4_t __p0, float32x4_t __p1) { 55145 float32x4_t __ret; 55146 __ret = (float32x4_t) __builtin_neon_vmulxq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 55147 return __ret; 55148 } 55149 #else 55150 __ai __attribute__((target("neon"))) float32x4_t vmulxq_f32(float32x4_t __p0, float32x4_t __p1) { 55151 float32x4_t __ret; 55152 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55153 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55154 __ret = (float32x4_t) __builtin_neon_vmulxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 55155 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55156 return __ret; 55157 } 55158 __ai __attribute__((target("neon"))) float32x4_t __noswap_vmulxq_f32(float32x4_t __p0, float32x4_t __p1) { 55159 float32x4_t __ret; 55160 __ret = (float32x4_t) __builtin_neon_vmulxq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 55161 return __ret; 55162 } 55163 #endif 55164 55165 __ai __attribute__((target("neon"))) float64x1_t vmulx_f64(float64x1_t __p0, float64x1_t __p1) { 55166 float64x1_t __ret; 55167 __ret = (float64x1_t) __builtin_neon_vmulx_v((int8x8_t)__p0, (int8x8_t)__p1, 10); 55168 return __ret; 55169 } 55170 #ifdef __LITTLE_ENDIAN__ 55171 __ai __attribute__((target("neon"))) float32x2_t vmulx_f32(float32x2_t __p0, float32x2_t __p1) { 55172 float32x2_t __ret; 55173 __ret = (float32x2_t) __builtin_neon_vmulx_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 55174 return __ret; 55175 } 55176 #else 55177 __ai __attribute__((target("neon"))) float32x2_t vmulx_f32(float32x2_t __p0, float32x2_t __p1) { 55178 
float32x2_t __ret; 55179 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55180 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55181 __ret = (float32x2_t) __builtin_neon_vmulx_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 55182 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55183 return __ret; 55184 } 55185 __ai __attribute__((target("neon"))) float32x2_t __noswap_vmulx_f32(float32x2_t __p0, float32x2_t __p1) { 55186 float32x2_t __ret; 55187 __ret = (float32x2_t) __builtin_neon_vmulx_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 55188 return __ret; 55189 } 55190 #endif 55191 55192 __ai __attribute__((target("neon"))) float64_t vmulxd_f64(float64_t __p0, float64_t __p1) { 55193 float64_t __ret; 55194 __ret = (float64_t) __builtin_neon_vmulxd_f64(__p0, __p1); 55195 return __ret; 55196 } 55197 __ai __attribute__((target("neon"))) float32_t vmulxs_f32(float32_t __p0, float32_t __p1) { 55198 float32_t __ret; 55199 __ret = (float32_t) __builtin_neon_vmulxs_f32(__p0, __p1); 55200 return __ret; 55201 } 55202 #define vmulxd_lane_f64(__p0_609, __p1_609, __p2_609) __extension__ ({ \ 55203 float64_t __ret_609; \ 55204 float64_t __s0_609 = __p0_609; \ 55205 float64x1_t __s1_609 = __p1_609; \ 55206 __ret_609 = vmulxd_f64(__s0_609, vget_lane_f64(__s1_609, __p2_609)); \ 55207 __ret_609; \ 55208 }) 55209 #ifdef __LITTLE_ENDIAN__ 55210 #define vmulxs_lane_f32(__p0_610, __p1_610, __p2_610) __extension__ ({ \ 55211 float32_t __ret_610; \ 55212 float32_t __s0_610 = __p0_610; \ 55213 float32x2_t __s1_610 = __p1_610; \ 55214 __ret_610 = vmulxs_f32(__s0_610, vget_lane_f32(__s1_610, __p2_610)); \ 55215 __ret_610; \ 55216 }) 55217 #else 55218 #define vmulxs_lane_f32(__p0_611, __p1_611, __p2_611) __extension__ ({ \ 55219 float32_t __ret_611; \ 55220 float32_t __s0_611 = __p0_611; \ 55221 float32x2_t __s1_611 = __p1_611; \ 55222 float32x2_t __rev1_611; __rev1_611 = __builtin_shufflevector(__s1_611, __s1_611, 1, 0); \ 55223 __ret_611 = 
vmulxs_f32(__s0_611, __noswap_vget_lane_f32(__rev1_611, __p2_611)); \ 55224 __ret_611; \ 55225 }) 55226 #endif 55227 55228 #ifdef __LITTLE_ENDIAN__ 55229 #define vmulxq_lane_f64(__p0_612, __p1_612, __p2_612) __extension__ ({ \ 55230 float64x2_t __ret_612; \ 55231 float64x2_t __s0_612 = __p0_612; \ 55232 float64x1_t __s1_612 = __p1_612; \ 55233 __ret_612 = vmulxq_f64(__s0_612, splatq_lane_f64(__s1_612, __p2_612)); \ 55234 __ret_612; \ 55235 }) 55236 #else 55237 #define vmulxq_lane_f64(__p0_613, __p1_613, __p2_613) __extension__ ({ \ 55238 float64x2_t __ret_613; \ 55239 float64x2_t __s0_613 = __p0_613; \ 55240 float64x1_t __s1_613 = __p1_613; \ 55241 float64x2_t __rev0_613; __rev0_613 = __builtin_shufflevector(__s0_613, __s0_613, 1, 0); \ 55242 __ret_613 = __noswap_vmulxq_f64(__rev0_613, __noswap_splatq_lane_f64(__s1_613, __p2_613)); \ 55243 __ret_613 = __builtin_shufflevector(__ret_613, __ret_613, 1, 0); \ 55244 __ret_613; \ 55245 }) 55246 #endif 55247 55248 #ifdef __LITTLE_ENDIAN__ 55249 #define vmulxq_lane_f32(__p0_614, __p1_614, __p2_614) __extension__ ({ \ 55250 float32x4_t __ret_614; \ 55251 float32x4_t __s0_614 = __p0_614; \ 55252 float32x2_t __s1_614 = __p1_614; \ 55253 __ret_614 = vmulxq_f32(__s0_614, splatq_lane_f32(__s1_614, __p2_614)); \ 55254 __ret_614; \ 55255 }) 55256 #else 55257 #define vmulxq_lane_f32(__p0_615, __p1_615, __p2_615) __extension__ ({ \ 55258 float32x4_t __ret_615; \ 55259 float32x4_t __s0_615 = __p0_615; \ 55260 float32x2_t __s1_615 = __p1_615; \ 55261 float32x4_t __rev0_615; __rev0_615 = __builtin_shufflevector(__s0_615, __s0_615, 3, 2, 1, 0); \ 55262 float32x2_t __rev1_615; __rev1_615 = __builtin_shufflevector(__s1_615, __s1_615, 1, 0); \ 55263 __ret_615 = __noswap_vmulxq_f32(__rev0_615, __noswap_splatq_lane_f32(__rev1_615, __p2_615)); \ 55264 __ret_615 = __builtin_shufflevector(__ret_615, __ret_615, 3, 2, 1, 0); \ 55265 __ret_615; \ 55266 }) 55267 #endif 55268 55269 #ifdef __LITTLE_ENDIAN__ 55270 #define vmulx_lane_f32(__p0_616, 
__p1_616, __p2_616) __extension__ ({ \ 55271 float32x2_t __ret_616; \ 55272 float32x2_t __s0_616 = __p0_616; \ 55273 float32x2_t __s1_616 = __p1_616; \ 55274 __ret_616 = vmulx_f32(__s0_616, splat_lane_f32(__s1_616, __p2_616)); \ 55275 __ret_616; \ 55276 }) 55277 #else 55278 #define vmulx_lane_f32(__p0_617, __p1_617, __p2_617) __extension__ ({ \ 55279 float32x2_t __ret_617; \ 55280 float32x2_t __s0_617 = __p0_617; \ 55281 float32x2_t __s1_617 = __p1_617; \ 55282 float32x2_t __rev0_617; __rev0_617 = __builtin_shufflevector(__s0_617, __s0_617, 1, 0); \ 55283 float32x2_t __rev1_617; __rev1_617 = __builtin_shufflevector(__s1_617, __s1_617, 1, 0); \ 55284 __ret_617 = __noswap_vmulx_f32(__rev0_617, __noswap_splat_lane_f32(__rev1_617, __p2_617)); \ 55285 __ret_617 = __builtin_shufflevector(__ret_617, __ret_617, 1, 0); \ 55286 __ret_617; \ 55287 }) 55288 #endif 55289 55290 #ifdef __LITTLE_ENDIAN__ 55291 #define vmulxd_laneq_f64(__p0_618, __p1_618, __p2_618) __extension__ ({ \ 55292 float64_t __ret_618; \ 55293 float64_t __s0_618 = __p0_618; \ 55294 float64x2_t __s1_618 = __p1_618; \ 55295 __ret_618 = vmulxd_f64(__s0_618, vgetq_lane_f64(__s1_618, __p2_618)); \ 55296 __ret_618; \ 55297 }) 55298 #else 55299 #define vmulxd_laneq_f64(__p0_619, __p1_619, __p2_619) __extension__ ({ \ 55300 float64_t __ret_619; \ 55301 float64_t __s0_619 = __p0_619; \ 55302 float64x2_t __s1_619 = __p1_619; \ 55303 float64x2_t __rev1_619; __rev1_619 = __builtin_shufflevector(__s1_619, __s1_619, 1, 0); \ 55304 __ret_619 = vmulxd_f64(__s0_619, __noswap_vgetq_lane_f64(__rev1_619, __p2_619)); \ 55305 __ret_619; \ 55306 }) 55307 #endif 55308 55309 #ifdef __LITTLE_ENDIAN__ 55310 #define vmulxs_laneq_f32(__p0_620, __p1_620, __p2_620) __extension__ ({ \ 55311 float32_t __ret_620; \ 55312 float32_t __s0_620 = __p0_620; \ 55313 float32x4_t __s1_620 = __p1_620; \ 55314 __ret_620 = vmulxs_f32(__s0_620, vgetq_lane_f32(__s1_620, __p2_620)); \ 55315 __ret_620; \ 55316 }) 55317 #else 55318 #define 
vmulxs_laneq_f32(__p0_621, __p1_621, __p2_621) __extension__ ({ \ 55319 float32_t __ret_621; \ 55320 float32_t __s0_621 = __p0_621; \ 55321 float32x4_t __s1_621 = __p1_621; \ 55322 float32x4_t __rev1_621; __rev1_621 = __builtin_shufflevector(__s1_621, __s1_621, 3, 2, 1, 0); \ 55323 __ret_621 = vmulxs_f32(__s0_621, __noswap_vgetq_lane_f32(__rev1_621, __p2_621)); \ 55324 __ret_621; \ 55325 }) 55326 #endif 55327 55328 #ifdef __LITTLE_ENDIAN__ 55329 #define vmulxq_laneq_f64(__p0_622, __p1_622, __p2_622) __extension__ ({ \ 55330 float64x2_t __ret_622; \ 55331 float64x2_t __s0_622 = __p0_622; \ 55332 float64x2_t __s1_622 = __p1_622; \ 55333 __ret_622 = vmulxq_f64(__s0_622, splatq_laneq_f64(__s1_622, __p2_622)); \ 55334 __ret_622; \ 55335 }) 55336 #else 55337 #define vmulxq_laneq_f64(__p0_623, __p1_623, __p2_623) __extension__ ({ \ 55338 float64x2_t __ret_623; \ 55339 float64x2_t __s0_623 = __p0_623; \ 55340 float64x2_t __s1_623 = __p1_623; \ 55341 float64x2_t __rev0_623; __rev0_623 = __builtin_shufflevector(__s0_623, __s0_623, 1, 0); \ 55342 float64x2_t __rev1_623; __rev1_623 = __builtin_shufflevector(__s1_623, __s1_623, 1, 0); \ 55343 __ret_623 = __noswap_vmulxq_f64(__rev0_623, __noswap_splatq_laneq_f64(__rev1_623, __p2_623)); \ 55344 __ret_623 = __builtin_shufflevector(__ret_623, __ret_623, 1, 0); \ 55345 __ret_623; \ 55346 }) 55347 #endif 55348 55349 #ifdef __LITTLE_ENDIAN__ 55350 #define vmulxq_laneq_f32(__p0_624, __p1_624, __p2_624) __extension__ ({ \ 55351 float32x4_t __ret_624; \ 55352 float32x4_t __s0_624 = __p0_624; \ 55353 float32x4_t __s1_624 = __p1_624; \ 55354 __ret_624 = vmulxq_f32(__s0_624, splatq_laneq_f32(__s1_624, __p2_624)); \ 55355 __ret_624; \ 55356 }) 55357 #else 55358 #define vmulxq_laneq_f32(__p0_625, __p1_625, __p2_625) __extension__ ({ \ 55359 float32x4_t __ret_625; \ 55360 float32x4_t __s0_625 = __p0_625; \ 55361 float32x4_t __s1_625 = __p1_625; \ 55362 float32x4_t __rev0_625; __rev0_625 = __builtin_shufflevector(__s0_625, __s0_625, 3, 2, 1, 
0); \ 55363 float32x4_t __rev1_625; __rev1_625 = __builtin_shufflevector(__s1_625, __s1_625, 3, 2, 1, 0); \ 55364 __ret_625 = __noswap_vmulxq_f32(__rev0_625, __noswap_splatq_laneq_f32(__rev1_625, __p2_625)); \ 55365 __ret_625 = __builtin_shufflevector(__ret_625, __ret_625, 3, 2, 1, 0); \ 55366 __ret_625; \ 55367 }) 55368 #endif 55369 55370 #ifdef __LITTLE_ENDIAN__ 55371 #define vmulx_laneq_f32(__p0_626, __p1_626, __p2_626) __extension__ ({ \ 55372 float32x2_t __ret_626; \ 55373 float32x2_t __s0_626 = __p0_626; \ 55374 float32x4_t __s1_626 = __p1_626; \ 55375 __ret_626 = vmulx_f32(__s0_626, splat_laneq_f32(__s1_626, __p2_626)); \ 55376 __ret_626; \ 55377 }) 55378 #else 55379 #define vmulx_laneq_f32(__p0_627, __p1_627, __p2_627) __extension__ ({ \ 55380 float32x2_t __ret_627; \ 55381 float32x2_t __s0_627 = __p0_627; \ 55382 float32x4_t __s1_627 = __p1_627; \ 55383 float32x2_t __rev0_627; __rev0_627 = __builtin_shufflevector(__s0_627, __s0_627, 1, 0); \ 55384 float32x4_t __rev1_627; __rev1_627 = __builtin_shufflevector(__s1_627, __s1_627, 3, 2, 1, 0); \ 55385 __ret_627 = __noswap_vmulx_f32(__rev0_627, __noswap_splat_laneq_f32(__rev1_627, __p2_627)); \ 55386 __ret_627 = __builtin_shufflevector(__ret_627, __ret_627, 1, 0); \ 55387 __ret_627; \ 55388 }) 55389 #endif 55390 55391 #ifdef __LITTLE_ENDIAN__ 55392 __ai __attribute__((target("neon"))) float64x2_t vnegq_f64(float64x2_t __p0) { 55393 float64x2_t __ret; 55394 __ret = -__p0; 55395 return __ret; 55396 } 55397 #else 55398 __ai __attribute__((target("neon"))) float64x2_t vnegq_f64(float64x2_t __p0) { 55399 float64x2_t __ret; 55400 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55401 __ret = -__rev0; 55402 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55403 return __ret; 55404 } 55405 #endif 55406 55407 #ifdef __LITTLE_ENDIAN__ 55408 __ai __attribute__((target("neon"))) int64x2_t vnegq_s64(int64x2_t __p0) { 55409 int64x2_t __ret; 55410 __ret = -__p0; 55411 return __ret; 55412 } 55413 
#else 55414 __ai __attribute__((target("neon"))) int64x2_t vnegq_s64(int64x2_t __p0) { 55415 int64x2_t __ret; 55416 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55417 __ret = -__rev0; 55418 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55419 return __ret; 55420 } 55421 #endif 55422 55423 __ai __attribute__((target("neon"))) float64x1_t vneg_f64(float64x1_t __p0) { 55424 float64x1_t __ret; 55425 __ret = -__p0; 55426 return __ret; 55427 } 55428 __ai __attribute__((target("neon"))) int64x1_t vneg_s64(int64x1_t __p0) { 55429 int64x1_t __ret; 55430 __ret = -__p0; 55431 return __ret; 55432 } 55433 __ai __attribute__((target("neon"))) int64_t vnegd_s64(int64_t __p0) { 55434 int64_t __ret; 55435 __ret = (int64_t) __builtin_neon_vnegd_s64(__p0); 55436 return __ret; 55437 } 55438 #ifdef __LITTLE_ENDIAN__ 55439 __ai __attribute__((target("neon"))) uint8x16_t vpaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 55440 uint8x16_t __ret; 55441 __ret = (uint8x16_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 55442 return __ret; 55443 } 55444 #else 55445 __ai __attribute__((target("neon"))) uint8x16_t vpaddq_u8(uint8x16_t __p0, uint8x16_t __p1) { 55446 uint8x16_t __ret; 55447 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55448 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55449 __ret = (uint8x16_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 55450 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55451 return __ret; 55452 } 55453 #endif 55454 55455 #ifdef __LITTLE_ENDIAN__ 55456 __ai __attribute__((target("neon"))) uint32x4_t vpaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 55457 uint32x4_t __ret; 55458 __ret = (uint32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 55459 return __ret; 55460 } 55461 #else 
55462 __ai __attribute__((target("neon"))) uint32x4_t vpaddq_u32(uint32x4_t __p0, uint32x4_t __p1) { 55463 uint32x4_t __ret; 55464 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55465 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55466 __ret = (uint32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 55467 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55468 return __ret; 55469 } 55470 #endif 55471 55472 #ifdef __LITTLE_ENDIAN__ 55473 __ai __attribute__((target("neon"))) uint64x2_t vpaddq_u64(uint64x2_t __p0, uint64x2_t __p1) { 55474 uint64x2_t __ret; 55475 __ret = (uint64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 55476 return __ret; 55477 } 55478 #else 55479 __ai __attribute__((target("neon"))) uint64x2_t vpaddq_u64(uint64x2_t __p0, uint64x2_t __p1) { 55480 uint64x2_t __ret; 55481 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55482 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55483 __ret = (uint64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 55484 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55485 return __ret; 55486 } 55487 #endif 55488 55489 #ifdef __LITTLE_ENDIAN__ 55490 __ai __attribute__((target("neon"))) uint16x8_t vpaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 55491 uint16x8_t __ret; 55492 __ret = (uint16x8_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 55493 return __ret; 55494 } 55495 #else 55496 __ai __attribute__((target("neon"))) uint16x8_t vpaddq_u16(uint16x8_t __p0, uint16x8_t __p1) { 55497 uint16x8_t __ret; 55498 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 55499 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 55500 __ret = (uint16x8_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 55501 __ret = 
__builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 55502 return __ret; 55503 } 55504 #endif 55505 55506 #ifdef __LITTLE_ENDIAN__ 55507 __ai __attribute__((target("neon"))) int8x16_t vpaddq_s8(int8x16_t __p0, int8x16_t __p1) { 55508 int8x16_t __ret; 55509 __ret = (int8x16_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 55510 return __ret; 55511 } 55512 #else 55513 __ai __attribute__((target("neon"))) int8x16_t vpaddq_s8(int8x16_t __p0, int8x16_t __p1) { 55514 int8x16_t __ret; 55515 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55516 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55517 __ret = (int8x16_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 55518 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55519 return __ret; 55520 } 55521 #endif 55522 55523 #ifdef __LITTLE_ENDIAN__ 55524 __ai __attribute__((target("neon"))) float64x2_t vpaddq_f64(float64x2_t __p0, float64x2_t __p1) { 55525 float64x2_t __ret; 55526 __ret = (float64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 55527 return __ret; 55528 } 55529 #else 55530 __ai __attribute__((target("neon"))) float64x2_t vpaddq_f64(float64x2_t __p0, float64x2_t __p1) { 55531 float64x2_t __ret; 55532 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55533 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55534 __ret = (float64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 55535 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55536 return __ret; 55537 } 55538 #endif 55539 55540 #ifdef __LITTLE_ENDIAN__ 55541 __ai __attribute__((target("neon"))) float32x4_t vpaddq_f32(float32x4_t __p0, float32x4_t __p1) { 55542 float32x4_t __ret; 55543 __ret = (float32x4_t) 
__builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 55544 return __ret; 55545 } 55546 #else 55547 __ai __attribute__((target("neon"))) float32x4_t vpaddq_f32(float32x4_t __p0, float32x4_t __p1) { 55548 float32x4_t __ret; 55549 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55550 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55551 __ret = (float32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 55552 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55553 return __ret; 55554 } 55555 #endif 55556 55557 #ifdef __LITTLE_ENDIAN__ 55558 __ai __attribute__((target("neon"))) int32x4_t vpaddq_s32(int32x4_t __p0, int32x4_t __p1) { 55559 int32x4_t __ret; 55560 __ret = (int32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 55561 return __ret; 55562 } 55563 #else 55564 __ai __attribute__((target("neon"))) int32x4_t vpaddq_s32(int32x4_t __p0, int32x4_t __p1) { 55565 int32x4_t __ret; 55566 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55567 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55568 __ret = (int32x4_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 55569 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55570 return __ret; 55571 } 55572 #endif 55573 55574 #ifdef __LITTLE_ENDIAN__ 55575 __ai __attribute__((target("neon"))) int64x2_t vpaddq_s64(int64x2_t __p0, int64x2_t __p1) { 55576 int64x2_t __ret; 55577 __ret = (int64x2_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 55578 return __ret; 55579 } 55580 #else 55581 __ai __attribute__((target("neon"))) int64x2_t vpaddq_s64(int64x2_t __p0, int64x2_t __p1) { 55582 int64x2_t __ret; 55583 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55584 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55585 __ret = (int64x2_t) 
__builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 55586 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55587 return __ret; 55588 } 55589 #endif 55590 55591 #ifdef __LITTLE_ENDIAN__ 55592 __ai __attribute__((target("neon"))) int16x8_t vpaddq_s16(int16x8_t __p0, int16x8_t __p1) { 55593 int16x8_t __ret; 55594 __ret = (int16x8_t) __builtin_neon_vpaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 55595 return __ret; 55596 } 55597 #else 55598 __ai __attribute__((target("neon"))) int16x8_t vpaddq_s16(int16x8_t __p0, int16x8_t __p1) { 55599 int16x8_t __ret; 55600 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 55601 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 55602 __ret = (int16x8_t) __builtin_neon_vpaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 55603 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 55604 return __ret; 55605 } 55606 #endif 55607 55608 #ifdef __LITTLE_ENDIAN__ 55609 __ai __attribute__((target("neon"))) uint64_t vpaddd_u64(uint64x2_t __p0) { 55610 uint64_t __ret; 55611 __ret = (uint64_t) __builtin_neon_vpaddd_u64(__p0); 55612 return __ret; 55613 } 55614 #else 55615 __ai __attribute__((target("neon"))) uint64_t vpaddd_u64(uint64x2_t __p0) { 55616 uint64_t __ret; 55617 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55618 __ret = (uint64_t) __builtin_neon_vpaddd_u64(__rev0); 55619 return __ret; 55620 } 55621 #endif 55622 55623 #ifdef __LITTLE_ENDIAN__ 55624 __ai __attribute__((target("neon"))) float64_t vpaddd_f64(float64x2_t __p0) { 55625 float64_t __ret; 55626 __ret = (float64_t) __builtin_neon_vpaddd_f64(__p0); 55627 return __ret; 55628 } 55629 #else 55630 __ai __attribute__((target("neon"))) float64_t vpaddd_f64(float64x2_t __p0) { 55631 float64_t __ret; 55632 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55633 __ret = (float64_t) __builtin_neon_vpaddd_f64(__rev0); 55634 return 
__ret; 55635 } 55636 #endif 55637 55638 #ifdef __LITTLE_ENDIAN__ 55639 __ai __attribute__((target("neon"))) int64_t vpaddd_s64(int64x2_t __p0) { 55640 int64_t __ret; 55641 __ret = (int64_t) __builtin_neon_vpaddd_s64(__p0); 55642 return __ret; 55643 } 55644 #else 55645 __ai __attribute__((target("neon"))) int64_t vpaddd_s64(int64x2_t __p0) { 55646 int64_t __ret; 55647 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55648 __ret = (int64_t) __builtin_neon_vpaddd_s64(__rev0); 55649 return __ret; 55650 } 55651 #endif 55652 55653 #ifdef __LITTLE_ENDIAN__ 55654 __ai __attribute__((target("neon"))) float32_t vpadds_f32(float32x2_t __p0) { 55655 float32_t __ret; 55656 __ret = (float32_t) __builtin_neon_vpadds_f32(__p0); 55657 return __ret; 55658 } 55659 #else 55660 __ai __attribute__((target("neon"))) float32_t vpadds_f32(float32x2_t __p0) { 55661 float32_t __ret; 55662 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55663 __ret = (float32_t) __builtin_neon_vpadds_f32(__rev0); 55664 return __ret; 55665 } 55666 #endif 55667 55668 #ifdef __LITTLE_ENDIAN__ 55669 __ai __attribute__((target("neon"))) uint8x16_t vpmaxq_u8(uint8x16_t __p0, uint8x16_t __p1) { 55670 uint8x16_t __ret; 55671 __ret = (uint8x16_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 55672 return __ret; 55673 } 55674 #else 55675 __ai __attribute__((target("neon"))) uint8x16_t vpmaxq_u8(uint8x16_t __p0, uint8x16_t __p1) { 55676 uint8x16_t __ret; 55677 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55678 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55679 __ret = (uint8x16_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 55680 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55681 return __ret; 55682 } 55683 #endif 55684 55685 #ifdef 
__LITTLE_ENDIAN__ 55686 __ai __attribute__((target("neon"))) uint32x4_t vpmaxq_u32(uint32x4_t __p0, uint32x4_t __p1) { 55687 uint32x4_t __ret; 55688 __ret = (uint32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 55689 return __ret; 55690 } 55691 #else 55692 __ai __attribute__((target("neon"))) uint32x4_t vpmaxq_u32(uint32x4_t __p0, uint32x4_t __p1) { 55693 uint32x4_t __ret; 55694 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55695 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55696 __ret = (uint32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 55697 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55698 return __ret; 55699 } 55700 #endif 55701 55702 #ifdef __LITTLE_ENDIAN__ 55703 __ai __attribute__((target("neon"))) uint16x8_t vpmaxq_u16(uint16x8_t __p0, uint16x8_t __p1) { 55704 uint16x8_t __ret; 55705 __ret = (uint16x8_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 55706 return __ret; 55707 } 55708 #else 55709 __ai __attribute__((target("neon"))) uint16x8_t vpmaxq_u16(uint16x8_t __p0, uint16x8_t __p1) { 55710 uint16x8_t __ret; 55711 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 55712 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 55713 __ret = (uint16x8_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 55714 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 55715 return __ret; 55716 } 55717 #endif 55718 55719 #ifdef __LITTLE_ENDIAN__ 55720 __ai __attribute__((target("neon"))) int8x16_t vpmaxq_s8(int8x16_t __p0, int8x16_t __p1) { 55721 int8x16_t __ret; 55722 __ret = (int8x16_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 55723 return __ret; 55724 } 55725 #else 55726 __ai __attribute__((target("neon"))) int8x16_t vpmaxq_s8(int8x16_t __p0, int8x16_t __p1) { 55727 int8x16_t __ret; 55728 
int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55729 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55730 __ret = (int8x16_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 55731 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55732 return __ret; 55733 } 55734 #endif 55735 55736 #ifdef __LITTLE_ENDIAN__ 55737 __ai __attribute__((target("neon"))) float64x2_t vpmaxq_f64(float64x2_t __p0, float64x2_t __p1) { 55738 float64x2_t __ret; 55739 __ret = (float64x2_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 55740 return __ret; 55741 } 55742 #else 55743 __ai __attribute__((target("neon"))) float64x2_t vpmaxq_f64(float64x2_t __p0, float64x2_t __p1) { 55744 float64x2_t __ret; 55745 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55746 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55747 __ret = (float64x2_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 55748 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55749 return __ret; 55750 } 55751 #endif 55752 55753 #ifdef __LITTLE_ENDIAN__ 55754 __ai __attribute__((target("neon"))) float32x4_t vpmaxq_f32(float32x4_t __p0, float32x4_t __p1) { 55755 float32x4_t __ret; 55756 __ret = (float32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 55757 return __ret; 55758 } 55759 #else 55760 __ai __attribute__((target("neon"))) float32x4_t vpmaxq_f32(float32x4_t __p0, float32x4_t __p1) { 55761 float32x4_t __ret; 55762 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55763 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55764 __ret = (float32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 55765 __ret = __builtin_shufflevector(__ret, 
__ret, 3, 2, 1, 0); 55766 return __ret; 55767 } 55768 #endif 55769 55770 #ifdef __LITTLE_ENDIAN__ 55771 __ai __attribute__((target("neon"))) int32x4_t vpmaxq_s32(int32x4_t __p0, int32x4_t __p1) { 55772 int32x4_t __ret; 55773 __ret = (int32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 55774 return __ret; 55775 } 55776 #else 55777 __ai __attribute__((target("neon"))) int32x4_t vpmaxq_s32(int32x4_t __p0, int32x4_t __p1) { 55778 int32x4_t __ret; 55779 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55780 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55781 __ret = (int32x4_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 55782 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55783 return __ret; 55784 } 55785 #endif 55786 55787 #ifdef __LITTLE_ENDIAN__ 55788 __ai __attribute__((target("neon"))) int16x8_t vpmaxq_s16(int16x8_t __p0, int16x8_t __p1) { 55789 int16x8_t __ret; 55790 __ret = (int16x8_t) __builtin_neon_vpmaxq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 55791 return __ret; 55792 } 55793 #else 55794 __ai __attribute__((target("neon"))) int16x8_t vpmaxq_s16(int16x8_t __p0, int16x8_t __p1) { 55795 int16x8_t __ret; 55796 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 55797 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 55798 __ret = (int16x8_t) __builtin_neon_vpmaxq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 55799 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 55800 return __ret; 55801 } 55802 #endif 55803 55804 #ifdef __LITTLE_ENDIAN__ 55805 __ai __attribute__((target("neon"))) float64_t vpmaxqd_f64(float64x2_t __p0) { 55806 float64_t __ret; 55807 __ret = (float64_t) __builtin_neon_vpmaxqd_f64(__p0); 55808 return __ret; 55809 } 55810 #else 55811 __ai __attribute__((target("neon"))) float64_t vpmaxqd_f64(float64x2_t __p0) { 55812 float64_t __ret; 55813 
float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55814 __ret = (float64_t) __builtin_neon_vpmaxqd_f64(__rev0); 55815 return __ret; 55816 } 55817 #endif 55818 55819 #ifdef __LITTLE_ENDIAN__ 55820 __ai __attribute__((target("neon"))) float32_t vpmaxs_f32(float32x2_t __p0) { 55821 float32_t __ret; 55822 __ret = (float32_t) __builtin_neon_vpmaxs_f32(__p0); 55823 return __ret; 55824 } 55825 #else 55826 __ai __attribute__((target("neon"))) float32_t vpmaxs_f32(float32x2_t __p0) { 55827 float32_t __ret; 55828 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55829 __ret = (float32_t) __builtin_neon_vpmaxs_f32(__rev0); 55830 return __ret; 55831 } 55832 #endif 55833 55834 #ifdef __LITTLE_ENDIAN__ 55835 __ai __attribute__((target("neon"))) float64x2_t vpmaxnmq_f64(float64x2_t __p0, float64x2_t __p1) { 55836 float64x2_t __ret; 55837 __ret = (float64x2_t) __builtin_neon_vpmaxnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 55838 return __ret; 55839 } 55840 #else 55841 __ai __attribute__((target("neon"))) float64x2_t vpmaxnmq_f64(float64x2_t __p0, float64x2_t __p1) { 55842 float64x2_t __ret; 55843 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55844 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55845 __ret = (float64x2_t) __builtin_neon_vpmaxnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 55846 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55847 return __ret; 55848 } 55849 #endif 55850 55851 #ifdef __LITTLE_ENDIAN__ 55852 __ai __attribute__((target("neon"))) float32x4_t vpmaxnmq_f32(float32x4_t __p0, float32x4_t __p1) { 55853 float32x4_t __ret; 55854 __ret = (float32x4_t) __builtin_neon_vpmaxnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 55855 return __ret; 55856 } 55857 #else 55858 __ai __attribute__((target("neon"))) float32x4_t vpmaxnmq_f32(float32x4_t __p0, float32x4_t __p1) { 55859 float32x4_t __ret; 55860 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 
1, 0); 55861 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55862 __ret = (float32x4_t) __builtin_neon_vpmaxnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 55863 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55864 return __ret; 55865 } 55866 #endif 55867 55868 #ifdef __LITTLE_ENDIAN__ 55869 __ai __attribute__((target("neon"))) float32x2_t vpmaxnm_f32(float32x2_t __p0, float32x2_t __p1) { 55870 float32x2_t __ret; 55871 __ret = (float32x2_t) __builtin_neon_vpmaxnm_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 55872 return __ret; 55873 } 55874 #else 55875 __ai __attribute__((target("neon"))) float32x2_t vpmaxnm_f32(float32x2_t __p0, float32x2_t __p1) { 55876 float32x2_t __ret; 55877 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55878 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55879 __ret = (float32x2_t) __builtin_neon_vpmaxnm_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 55880 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55881 return __ret; 55882 } 55883 #endif 55884 55885 #ifdef __LITTLE_ENDIAN__ 55886 __ai __attribute__((target("neon"))) float64_t vpmaxnmqd_f64(float64x2_t __p0) { 55887 float64_t __ret; 55888 __ret = (float64_t) __builtin_neon_vpmaxnmqd_f64(__p0); 55889 return __ret; 55890 } 55891 #else 55892 __ai __attribute__((target("neon"))) float64_t vpmaxnmqd_f64(float64x2_t __p0) { 55893 float64_t __ret; 55894 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55895 __ret = (float64_t) __builtin_neon_vpmaxnmqd_f64(__rev0); 55896 return __ret; 55897 } 55898 #endif 55899 55900 #ifdef __LITTLE_ENDIAN__ 55901 __ai __attribute__((target("neon"))) float32_t vpmaxnms_f32(float32x2_t __p0) { 55902 float32_t __ret; 55903 __ret = (float32_t) __builtin_neon_vpmaxnms_f32(__p0); 55904 return __ret; 55905 } 55906 #else 55907 __ai __attribute__((target("neon"))) float32_t vpmaxnms_f32(float32x2_t __p0) { 55908 float32_t __ret; 55909 float32x2_t __rev0; __rev0 
= __builtin_shufflevector(__p0, __p0, 1, 0); 55910 __ret = (float32_t) __builtin_neon_vpmaxnms_f32(__rev0); 55911 return __ret; 55912 } 55913 #endif 55914 55915 #ifdef __LITTLE_ENDIAN__ 55916 __ai __attribute__((target("neon"))) uint8x16_t vpminq_u8(uint8x16_t __p0, uint8x16_t __p1) { 55917 uint8x16_t __ret; 55918 __ret = (uint8x16_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 55919 return __ret; 55920 } 55921 #else 55922 __ai __attribute__((target("neon"))) uint8x16_t vpminq_u8(uint8x16_t __p0, uint8x16_t __p1) { 55923 uint8x16_t __ret; 55924 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55925 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55926 __ret = (uint8x16_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 55927 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55928 return __ret; 55929 } 55930 #endif 55931 55932 #ifdef __LITTLE_ENDIAN__ 55933 __ai __attribute__((target("neon"))) uint32x4_t vpminq_u32(uint32x4_t __p0, uint32x4_t __p1) { 55934 uint32x4_t __ret; 55935 __ret = (uint32x4_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 55936 return __ret; 55937 } 55938 #else 55939 __ai __attribute__((target("neon"))) uint32x4_t vpminq_u32(uint32x4_t __p0, uint32x4_t __p1) { 55940 uint32x4_t __ret; 55941 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 55942 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 55943 __ret = (uint32x4_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 55944 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 55945 return __ret; 55946 } 55947 #endif 55948 55949 #ifdef __LITTLE_ENDIAN__ 55950 __ai __attribute__((target("neon"))) uint16x8_t vpminq_u16(uint16x8_t __p0, uint16x8_t __p1) { 55951 uint16x8_t 
__ret; 55952 __ret = (uint16x8_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 55953 return __ret; 55954 } 55955 #else 55956 __ai __attribute__((target("neon"))) uint16x8_t vpminq_u16(uint16x8_t __p0, uint16x8_t __p1) { 55957 uint16x8_t __ret; 55958 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 55959 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 55960 __ret = (uint16x8_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 55961 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 55962 return __ret; 55963 } 55964 #endif 55965 55966 #ifdef __LITTLE_ENDIAN__ 55967 __ai __attribute__((target("neon"))) int8x16_t vpminq_s8(int8x16_t __p0, int8x16_t __p1) { 55968 int8x16_t __ret; 55969 __ret = (int8x16_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 55970 return __ret; 55971 } 55972 #else 55973 __ai __attribute__((target("neon"))) int8x16_t vpminq_s8(int8x16_t __p0, int8x16_t __p1) { 55974 int8x16_t __ret; 55975 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55976 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55977 __ret = (int8x16_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 55978 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 55979 return __ret; 55980 } 55981 #endif 55982 55983 #ifdef __LITTLE_ENDIAN__ 55984 __ai __attribute__((target("neon"))) float64x2_t vpminq_f64(float64x2_t __p0, float64x2_t __p1) { 55985 float64x2_t __ret; 55986 __ret = (float64x2_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 55987 return __ret; 55988 } 55989 #else 55990 __ai __attribute__((target("neon"))) float64x2_t vpminq_f64(float64x2_t __p0, float64x2_t __p1) { 55991 float64x2_t __ret; 55992 
float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 55993 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 55994 __ret = (float64x2_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 55995 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 55996 return __ret; 55997 } 55998 #endif 55999 56000 #ifdef __LITTLE_ENDIAN__ 56001 __ai __attribute__((target("neon"))) float32x4_t vpminq_f32(float32x4_t __p0, float32x4_t __p1) { 56002 float32x4_t __ret; 56003 __ret = (float32x4_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 56004 return __ret; 56005 } 56006 #else 56007 __ai __attribute__((target("neon"))) float32x4_t vpminq_f32(float32x4_t __p0, float32x4_t __p1) { 56008 float32x4_t __ret; 56009 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 56010 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 56011 __ret = (float32x4_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 56012 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 56013 return __ret; 56014 } 56015 #endif 56016 56017 #ifdef __LITTLE_ENDIAN__ 56018 __ai __attribute__((target("neon"))) int32x4_t vpminq_s32(int32x4_t __p0, int32x4_t __p1) { 56019 int32x4_t __ret; 56020 __ret = (int32x4_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 56021 return __ret; 56022 } 56023 #else 56024 __ai __attribute__((target("neon"))) int32x4_t vpminq_s32(int32x4_t __p0, int32x4_t __p1) { 56025 int32x4_t __ret; 56026 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 56027 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 56028 __ret = (int32x4_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 56029 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 56030 return __ret; 56031 } 56032 #endif 56033 56034 #ifdef __LITTLE_ENDIAN__ 56035 __ai __attribute__((target("neon"))) 
int16x8_t vpminq_s16(int16x8_t __p0, int16x8_t __p1) { 56036 int16x8_t __ret; 56037 __ret = (int16x8_t) __builtin_neon_vpminq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 56038 return __ret; 56039 } 56040 #else 56041 __ai __attribute__((target("neon"))) int16x8_t vpminq_s16(int16x8_t __p0, int16x8_t __p1) { 56042 int16x8_t __ret; 56043 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 56044 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 56045 __ret = (int16x8_t) __builtin_neon_vpminq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 56046 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 56047 return __ret; 56048 } 56049 #endif 56050 56051 #ifdef __LITTLE_ENDIAN__ 56052 __ai __attribute__((target("neon"))) float64_t vpminqd_f64(float64x2_t __p0) { 56053 float64_t __ret; 56054 __ret = (float64_t) __builtin_neon_vpminqd_f64(__p0); 56055 return __ret; 56056 } 56057 #else 56058 __ai __attribute__((target("neon"))) float64_t vpminqd_f64(float64x2_t __p0) { 56059 float64_t __ret; 56060 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56061 __ret = (float64_t) __builtin_neon_vpminqd_f64(__rev0); 56062 return __ret; 56063 } 56064 #endif 56065 56066 #ifdef __LITTLE_ENDIAN__ 56067 __ai __attribute__((target("neon"))) float32_t vpmins_f32(float32x2_t __p0) { 56068 float32_t __ret; 56069 __ret = (float32_t) __builtin_neon_vpmins_f32(__p0); 56070 return __ret; 56071 } 56072 #else 56073 __ai __attribute__((target("neon"))) float32_t vpmins_f32(float32x2_t __p0) { 56074 float32_t __ret; 56075 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56076 __ret = (float32_t) __builtin_neon_vpmins_f32(__rev0); 56077 return __ret; 56078 } 56079 #endif 56080 56081 #ifdef __LITTLE_ENDIAN__ 56082 __ai __attribute__((target("neon"))) float64x2_t vpminnmq_f64(float64x2_t __p0, float64x2_t __p1) { 56083 float64x2_t __ret; 56084 __ret = (float64x2_t) 
__builtin_neon_vpminnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 56085 return __ret; 56086 } 56087 #else 56088 __ai __attribute__((target("neon"))) float64x2_t vpminnmq_f64(float64x2_t __p0, float64x2_t __p1) { 56089 float64x2_t __ret; 56090 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56091 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 56092 __ret = (float64x2_t) __builtin_neon_vpminnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 56093 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 56094 return __ret; 56095 } 56096 #endif 56097 56098 #ifdef __LITTLE_ENDIAN__ 56099 __ai __attribute__((target("neon"))) float32x4_t vpminnmq_f32(float32x4_t __p0, float32x4_t __p1) { 56100 float32x4_t __ret; 56101 __ret = (float32x4_t) __builtin_neon_vpminnmq_v((int8x16_t)__p0, (int8x16_t)__p1, 41); 56102 return __ret; 56103 } 56104 #else 56105 __ai __attribute__((target("neon"))) float32x4_t vpminnmq_f32(float32x4_t __p0, float32x4_t __p1) { 56106 float32x4_t __ret; 56107 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 56108 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 56109 __ret = (float32x4_t) __builtin_neon_vpminnmq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 41); 56110 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 56111 return __ret; 56112 } 56113 #endif 56114 56115 #ifdef __LITTLE_ENDIAN__ 56116 __ai __attribute__((target("neon"))) float32x2_t vpminnm_f32(float32x2_t __p0, float32x2_t __p1) { 56117 float32x2_t __ret; 56118 __ret = (float32x2_t) __builtin_neon_vpminnm_v((int8x8_t)__p0, (int8x8_t)__p1, 9); 56119 return __ret; 56120 } 56121 #else 56122 __ai __attribute__((target("neon"))) float32x2_t vpminnm_f32(float32x2_t __p0, float32x2_t __p1) { 56123 float32x2_t __ret; 56124 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56125 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 56126 __ret = 
(float32x2_t) __builtin_neon_vpminnm_v((int8x8_t)__rev0, (int8x8_t)__rev1, 9); 56127 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 56128 return __ret; 56129 } 56130 #endif 56131 56132 #ifdef __LITTLE_ENDIAN__ 56133 __ai __attribute__((target("neon"))) float64_t vpminnmqd_f64(float64x2_t __p0) { 56134 float64_t __ret; 56135 __ret = (float64_t) __builtin_neon_vpminnmqd_f64(__p0); 56136 return __ret; 56137 } 56138 #else 56139 __ai __attribute__((target("neon"))) float64_t vpminnmqd_f64(float64x2_t __p0) { 56140 float64_t __ret; 56141 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56142 __ret = (float64_t) __builtin_neon_vpminnmqd_f64(__rev0); 56143 return __ret; 56144 } 56145 #endif 56146 56147 #ifdef __LITTLE_ENDIAN__ 56148 __ai __attribute__((target("neon"))) float32_t vpminnms_f32(float32x2_t __p0) { 56149 float32_t __ret; 56150 __ret = (float32_t) __builtin_neon_vpminnms_f32(__p0); 56151 return __ret; 56152 } 56153 #else 56154 __ai __attribute__((target("neon"))) float32_t vpminnms_f32(float32x2_t __p0) { 56155 float32_t __ret; 56156 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56157 __ret = (float32_t) __builtin_neon_vpminnms_f32(__rev0); 56158 return __ret; 56159 } 56160 #endif 56161 56162 #ifdef __LITTLE_ENDIAN__ 56163 __ai __attribute__((target("neon"))) int64x2_t vqabsq_s64(int64x2_t __p0) { 56164 int64x2_t __ret; 56165 __ret = (int64x2_t) __builtin_neon_vqabsq_v((int8x16_t)__p0, 35); 56166 return __ret; 56167 } 56168 #else 56169 __ai __attribute__((target("neon"))) int64x2_t vqabsq_s64(int64x2_t __p0) { 56170 int64x2_t __ret; 56171 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56172 __ret = (int64x2_t) __builtin_neon_vqabsq_v((int8x16_t)__rev0, 35); 56173 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 56174 return __ret; 56175 } 56176 #endif 56177 56178 __ai __attribute__((target("neon"))) int64x1_t vqabs_s64(int64x1_t __p0) { 56179 int64x1_t __ret; 56180 __ret = 
(int64x1_t) __builtin_neon_vqabs_v((int8x8_t)__p0, 3); 56181 return __ret; 56182 } 56183 __ai __attribute__((target("neon"))) int8_t vqabsb_s8(int8_t __p0) { 56184 int8_t __ret; 56185 __ret = (int8_t) __builtin_neon_vqabsb_s8(__p0); 56186 return __ret; 56187 } 56188 __ai __attribute__((target("neon"))) int32_t vqabss_s32(int32_t __p0) { 56189 int32_t __ret; 56190 __ret = (int32_t) __builtin_neon_vqabss_s32(__p0); 56191 return __ret; 56192 } 56193 __ai __attribute__((target("neon"))) int64_t vqabsd_s64(int64_t __p0) { 56194 int64_t __ret; 56195 __ret = (int64_t) __builtin_neon_vqabsd_s64(__p0); 56196 return __ret; 56197 } 56198 __ai __attribute__((target("neon"))) int16_t vqabsh_s16(int16_t __p0) { 56199 int16_t __ret; 56200 __ret = (int16_t) __builtin_neon_vqabsh_s16(__p0); 56201 return __ret; 56202 } 56203 __ai __attribute__((target("neon"))) uint8_t vqaddb_u8(uint8_t __p0, uint8_t __p1) { 56204 uint8_t __ret; 56205 __ret = (uint8_t) __builtin_neon_vqaddb_u8(__p0, __p1); 56206 return __ret; 56207 } 56208 __ai __attribute__((target("neon"))) uint32_t vqadds_u32(uint32_t __p0, uint32_t __p1) { 56209 uint32_t __ret; 56210 __ret = (uint32_t) __builtin_neon_vqadds_u32(__p0, __p1); 56211 return __ret; 56212 } 56213 __ai __attribute__((target("neon"))) uint64_t vqaddd_u64(uint64_t __p0, uint64_t __p1) { 56214 uint64_t __ret; 56215 __ret = (uint64_t) __builtin_neon_vqaddd_u64(__p0, __p1); 56216 return __ret; 56217 } 56218 __ai __attribute__((target("neon"))) uint16_t vqaddh_u16(uint16_t __p0, uint16_t __p1) { 56219 uint16_t __ret; 56220 __ret = (uint16_t) __builtin_neon_vqaddh_u16(__p0, __p1); 56221 return __ret; 56222 } 56223 __ai __attribute__((target("neon"))) int8_t vqaddb_s8(int8_t __p0, int8_t __p1) { 56224 int8_t __ret; 56225 __ret = (int8_t) __builtin_neon_vqaddb_s8(__p0, __p1); 56226 return __ret; 56227 } 56228 __ai __attribute__((target("neon"))) int32_t vqadds_s32(int32_t __p0, int32_t __p1) { 56229 int32_t __ret; 56230 __ret = (int32_t) 
__builtin_neon_vqadds_s32(__p0, __p1); 56231 return __ret; 56232 } 56233 __ai __attribute__((target("neon"))) int64_t vqaddd_s64(int64_t __p0, int64_t __p1) { 56234 int64_t __ret; 56235 __ret = (int64_t) __builtin_neon_vqaddd_s64(__p0, __p1); 56236 return __ret; 56237 } 56238 __ai __attribute__((target("neon"))) int16_t vqaddh_s16(int16_t __p0, int16_t __p1) { 56239 int16_t __ret; 56240 __ret = (int16_t) __builtin_neon_vqaddh_s16(__p0, __p1); 56241 return __ret; 56242 } 56243 __ai __attribute__((target("neon"))) int64_t vqdmlals_s32(int64_t __p0, int32_t __p1, int32_t __p2) { 56244 int64_t __ret; 56245 __ret = (int64_t) __builtin_neon_vqdmlals_s32(__p0, __p1, __p2); 56246 return __ret; 56247 } 56248 __ai __attribute__((target("neon"))) int32_t vqdmlalh_s16(int32_t __p0, int16_t __p1, int16_t __p2) { 56249 int32_t __ret; 56250 __ret = (int32_t) __builtin_neon_vqdmlalh_s16(__p0, __p1, __p2); 56251 return __ret; 56252 } 56253 #ifdef __LITTLE_ENDIAN__ 56254 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 56255 int64x2_t __ret; 56256 __ret = vqdmlal_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2)); 56257 return __ret; 56258 } 56259 #else 56260 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 56261 int64x2_t __ret; 56262 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56263 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 56264 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 56265 __ret = __noswap_vqdmlal_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2)); 56266 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 56267 return __ret; 56268 } 56269 #endif 56270 56271 #ifdef __LITTLE_ENDIAN__ 56272 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 56273 int32x4_t __ret; 56274 
__ret = vqdmlal_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2)); 56275 return __ret; 56276 } 56277 #else 56278 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 56279 int32x4_t __ret; 56280 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 56281 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 56282 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 56283 __ret = __noswap_vqdmlal_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2)); 56284 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 56285 return __ret; 56286 } 56287 #endif 56288 56289 #ifdef __LITTLE_ENDIAN__ 56290 #define vqdmlal_high_lane_s32(__p0_628, __p1_628, __p2_628, __p3_628) __extension__ ({ \ 56291 int64x2_t __ret_628; \ 56292 int64x2_t __s0_628 = __p0_628; \ 56293 int32x4_t __s1_628 = __p1_628; \ 56294 int32x2_t __s2_628 = __p2_628; \ 56295 __ret_628 = vqdmlal_s32(__s0_628, vget_high_s32(__s1_628), splat_lane_s32(__s2_628, __p3_628)); \ 56296 __ret_628; \ 56297 }) 56298 #else 56299 #define vqdmlal_high_lane_s32(__p0_629, __p1_629, __p2_629, __p3_629) __extension__ ({ \ 56300 int64x2_t __ret_629; \ 56301 int64x2_t __s0_629 = __p0_629; \ 56302 int32x4_t __s1_629 = __p1_629; \ 56303 int32x2_t __s2_629 = __p2_629; \ 56304 int64x2_t __rev0_629; __rev0_629 = __builtin_shufflevector(__s0_629, __s0_629, 1, 0); \ 56305 int32x4_t __rev1_629; __rev1_629 = __builtin_shufflevector(__s1_629, __s1_629, 3, 2, 1, 0); \ 56306 int32x2_t __rev2_629; __rev2_629 = __builtin_shufflevector(__s2_629, __s2_629, 1, 0); \ 56307 __ret_629 = __noswap_vqdmlal_s32(__rev0_629, __noswap_vget_high_s32(__rev1_629), __noswap_splat_lane_s32(__rev2_629, __p3_629)); \ 56308 __ret_629 = __builtin_shufflevector(__ret_629, __ret_629, 1, 0); \ 56309 __ret_629; \ 56310 }) 56311 #endif 56312 56313 #ifdef __LITTLE_ENDIAN__ 56314 #define 
vqdmlal_high_lane_s16(__p0_630, __p1_630, __p2_630, __p3_630) __extension__ ({ \ 56315 int32x4_t __ret_630; \ 56316 int32x4_t __s0_630 = __p0_630; \ 56317 int16x8_t __s1_630 = __p1_630; \ 56318 int16x4_t __s2_630 = __p2_630; \ 56319 __ret_630 = vqdmlal_s16(__s0_630, vget_high_s16(__s1_630), splat_lane_s16(__s2_630, __p3_630)); \ 56320 __ret_630; \ 56321 }) 56322 #else 56323 #define vqdmlal_high_lane_s16(__p0_631, __p1_631, __p2_631, __p3_631) __extension__ ({ \ 56324 int32x4_t __ret_631; \ 56325 int32x4_t __s0_631 = __p0_631; \ 56326 int16x8_t __s1_631 = __p1_631; \ 56327 int16x4_t __s2_631 = __p2_631; \ 56328 int32x4_t __rev0_631; __rev0_631 = __builtin_shufflevector(__s0_631, __s0_631, 3, 2, 1, 0); \ 56329 int16x8_t __rev1_631; __rev1_631 = __builtin_shufflevector(__s1_631, __s1_631, 7, 6, 5, 4, 3, 2, 1, 0); \ 56330 int16x4_t __rev2_631; __rev2_631 = __builtin_shufflevector(__s2_631, __s2_631, 3, 2, 1, 0); \ 56331 __ret_631 = __noswap_vqdmlal_s16(__rev0_631, __noswap_vget_high_s16(__rev1_631), __noswap_splat_lane_s16(__rev2_631, __p3_631)); \ 56332 __ret_631 = __builtin_shufflevector(__ret_631, __ret_631, 3, 2, 1, 0); \ 56333 __ret_631; \ 56334 }) 56335 #endif 56336 56337 #ifdef __LITTLE_ENDIAN__ 56338 #define vqdmlal_high_laneq_s32(__p0_632, __p1_632, __p2_632, __p3_632) __extension__ ({ \ 56339 int64x2_t __ret_632; \ 56340 int64x2_t __s0_632 = __p0_632; \ 56341 int32x4_t __s1_632 = __p1_632; \ 56342 int32x4_t __s2_632 = __p2_632; \ 56343 __ret_632 = vqdmlal_s32(__s0_632, vget_high_s32(__s1_632), splat_laneq_s32(__s2_632, __p3_632)); \ 56344 __ret_632; \ 56345 }) 56346 #else 56347 #define vqdmlal_high_laneq_s32(__p0_633, __p1_633, __p2_633, __p3_633) __extension__ ({ \ 56348 int64x2_t __ret_633; \ 56349 int64x2_t __s0_633 = __p0_633; \ 56350 int32x4_t __s1_633 = __p1_633; \ 56351 int32x4_t __s2_633 = __p2_633; \ 56352 int64x2_t __rev0_633; __rev0_633 = __builtin_shufflevector(__s0_633, __s0_633, 1, 0); \ 56353 int32x4_t __rev1_633; __rev1_633 = 
__builtin_shufflevector(__s1_633, __s1_633, 3, 2, 1, 0); \ 56354 int32x4_t __rev2_633; __rev2_633 = __builtin_shufflevector(__s2_633, __s2_633, 3, 2, 1, 0); \ 56355 __ret_633 = __noswap_vqdmlal_s32(__rev0_633, __noswap_vget_high_s32(__rev1_633), __noswap_splat_laneq_s32(__rev2_633, __p3_633)); \ 56356 __ret_633 = __builtin_shufflevector(__ret_633, __ret_633, 1, 0); \ 56357 __ret_633; \ 56358 }) 56359 #endif 56360 56361 #ifdef __LITTLE_ENDIAN__ 56362 #define vqdmlal_high_laneq_s16(__p0_634, __p1_634, __p2_634, __p3_634) __extension__ ({ \ 56363 int32x4_t __ret_634; \ 56364 int32x4_t __s0_634 = __p0_634; \ 56365 int16x8_t __s1_634 = __p1_634; \ 56366 int16x8_t __s2_634 = __p2_634; \ 56367 __ret_634 = vqdmlal_s16(__s0_634, vget_high_s16(__s1_634), splat_laneq_s16(__s2_634, __p3_634)); \ 56368 __ret_634; \ 56369 }) 56370 #else 56371 #define vqdmlal_high_laneq_s16(__p0_635, __p1_635, __p2_635, __p3_635) __extension__ ({ \ 56372 int32x4_t __ret_635; \ 56373 int32x4_t __s0_635 = __p0_635; \ 56374 int16x8_t __s1_635 = __p1_635; \ 56375 int16x8_t __s2_635 = __p2_635; \ 56376 int32x4_t __rev0_635; __rev0_635 = __builtin_shufflevector(__s0_635, __s0_635, 3, 2, 1, 0); \ 56377 int16x8_t __rev1_635; __rev1_635 = __builtin_shufflevector(__s1_635, __s1_635, 7, 6, 5, 4, 3, 2, 1, 0); \ 56378 int16x8_t __rev2_635; __rev2_635 = __builtin_shufflevector(__s2_635, __s2_635, 7, 6, 5, 4, 3, 2, 1, 0); \ 56379 __ret_635 = __noswap_vqdmlal_s16(__rev0_635, __noswap_vget_high_s16(__rev1_635), __noswap_splat_laneq_s16(__rev2_635, __p3_635)); \ 56380 __ret_635 = __builtin_shufflevector(__ret_635, __ret_635, 3, 2, 1, 0); \ 56381 __ret_635; \ 56382 }) 56383 #endif 56384 56385 #ifdef __LITTLE_ENDIAN__ 56386 __ai __attribute__((target("neon"))) int64x2_t vqdmlal_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) { 56387 int64x2_t __ret; 56388 __ret = vqdmlal_n_s32(__p0, vget_high_s32(__p1), __p2); 56389 return __ret; 56390 } 56391 #else 56392 __ai __attribute__((target("neon"))) int64x2_t 
vqdmlal_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) { 56393 int64x2_t __ret; 56394 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56395 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 56396 __ret = __noswap_vqdmlal_n_s32(__rev0, __noswap_vget_high_s32(__rev1), __p2); 56397 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 56398 return __ret; 56399 } 56400 #endif 56401 56402 #ifdef __LITTLE_ENDIAN__ 56403 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) { 56404 int32x4_t __ret; 56405 __ret = vqdmlal_n_s16(__p0, vget_high_s16(__p1), __p2); 56406 return __ret; 56407 } 56408 #else 56409 __ai __attribute__((target("neon"))) int32x4_t vqdmlal_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) { 56410 int32x4_t __ret; 56411 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 56412 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 56413 __ret = __noswap_vqdmlal_n_s16(__rev0, __noswap_vget_high_s16(__rev1), __p2); 56414 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 56415 return __ret; 56416 } 56417 #endif 56418 56419 #ifdef __LITTLE_ENDIAN__ 56420 #define vqdmlals_lane_s32(__p0, __p1, __p2, __p3) __extension__ ({ \ 56421 int64_t __ret; \ 56422 int64_t __s0 = __p0; \ 56423 int32_t __s1 = __p1; \ 56424 int32x2_t __s2 = __p2; \ 56425 __ret = (int64_t) __builtin_neon_vqdmlals_lane_s32(__s0, __s1, __s2, __p3); \ 56426 __ret; \ 56427 }) 56428 #else 56429 #define vqdmlals_lane_s32(__p0, __p1, __p2, __p3) __extension__ ({ \ 56430 int64_t __ret; \ 56431 int64_t __s0 = __p0; \ 56432 int32_t __s1 = __p1; \ 56433 int32x2_t __s2 = __p2; \ 56434 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \ 56435 __ret = (int64_t) __builtin_neon_vqdmlals_lane_s32(__s0, __s1, __rev2, __p3); \ 56436 __ret; \ 56437 }) 56438 #endif 56439 56440 #ifdef __LITTLE_ENDIAN__ 56441 
#define vqdmlalh_lane_s16(__p0, __p1, __p2, __p3) __extension__ ({ \ 56442 int32_t __ret; \ 56443 int32_t __s0 = __p0; \ 56444 int16_t __s1 = __p1; \ 56445 int16x4_t __s2 = __p2; \ 56446 __ret = (int32_t) __builtin_neon_vqdmlalh_lane_s16(__s0, __s1, __s2, __p3); \ 56447 __ret; \ 56448 }) 56449 #else 56450 #define vqdmlalh_lane_s16(__p0, __p1, __p2, __p3) __extension__ ({ \ 56451 int32_t __ret; \ 56452 int32_t __s0 = __p0; \ 56453 int16_t __s1 = __p1; \ 56454 int16x4_t __s2 = __p2; \ 56455 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 56456 __ret = (int32_t) __builtin_neon_vqdmlalh_lane_s16(__s0, __s1, __rev2, __p3); \ 56457 __ret; \ 56458 }) 56459 #endif 56460 56461 #ifdef __LITTLE_ENDIAN__ 56462 #define vqdmlals_laneq_s32(__p0, __p1, __p2, __p3) __extension__ ({ \ 56463 int64_t __ret; \ 56464 int64_t __s0 = __p0; \ 56465 int32_t __s1 = __p1; \ 56466 int32x4_t __s2 = __p2; \ 56467 __ret = (int64_t) __builtin_neon_vqdmlals_laneq_s32(__s0, __s1, __s2, __p3); \ 56468 __ret; \ 56469 }) 56470 #else 56471 #define vqdmlals_laneq_s32(__p0, __p1, __p2, __p3) __extension__ ({ \ 56472 int64_t __ret; \ 56473 int64_t __s0 = __p0; \ 56474 int32_t __s1 = __p1; \ 56475 int32x4_t __s2 = __p2; \ 56476 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 56477 __ret = (int64_t) __builtin_neon_vqdmlals_laneq_s32(__s0, __s1, __rev2, __p3); \ 56478 __ret; \ 56479 }) 56480 #endif 56481 56482 #ifdef __LITTLE_ENDIAN__ 56483 #define vqdmlalh_laneq_s16(__p0, __p1, __p2, __p3) __extension__ ({ \ 56484 int32_t __ret; \ 56485 int32_t __s0 = __p0; \ 56486 int16_t __s1 = __p1; \ 56487 int16x8_t __s2 = __p2; \ 56488 __ret = (int32_t) __builtin_neon_vqdmlalh_laneq_s16(__s0, __s1, __s2, __p3); \ 56489 __ret; \ 56490 }) 56491 #else 56492 #define vqdmlalh_laneq_s16(__p0, __p1, __p2, __p3) __extension__ ({ \ 56493 int32_t __ret; \ 56494 int32_t __s0 = __p0; \ 56495 int16_t __s1 = __p1; \ 56496 int16x8_t __s2 = __p2; \ 56497 int16x8_t __rev2; 
__rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 56498 __ret = (int32_t) __builtin_neon_vqdmlalh_laneq_s16(__s0, __s1, __rev2, __p3); \ 56499 __ret; \ 56500 }) 56501 #endif 56502 56503 #ifdef __LITTLE_ENDIAN__ 56504 #define vqdmlal_laneq_s32(__p0_636, __p1_636, __p2_636, __p3_636) __extension__ ({ \ 56505 int64x2_t __ret_636; \ 56506 int64x2_t __s0_636 = __p0_636; \ 56507 int32x2_t __s1_636 = __p1_636; \ 56508 int32x4_t __s2_636 = __p2_636; \ 56509 __ret_636 = vqdmlal_s32(__s0_636, __s1_636, splat_laneq_s32(__s2_636, __p3_636)); \ 56510 __ret_636; \ 56511 }) 56512 #else 56513 #define vqdmlal_laneq_s32(__p0_637, __p1_637, __p2_637, __p3_637) __extension__ ({ \ 56514 int64x2_t __ret_637; \ 56515 int64x2_t __s0_637 = __p0_637; \ 56516 int32x2_t __s1_637 = __p1_637; \ 56517 int32x4_t __s2_637 = __p2_637; \ 56518 int64x2_t __rev0_637; __rev0_637 = __builtin_shufflevector(__s0_637, __s0_637, 1, 0); \ 56519 int32x2_t __rev1_637; __rev1_637 = __builtin_shufflevector(__s1_637, __s1_637, 1, 0); \ 56520 int32x4_t __rev2_637; __rev2_637 = __builtin_shufflevector(__s2_637, __s2_637, 3, 2, 1, 0); \ 56521 __ret_637 = __noswap_vqdmlal_s32(__rev0_637, __rev1_637, __noswap_splat_laneq_s32(__rev2_637, __p3_637)); \ 56522 __ret_637 = __builtin_shufflevector(__ret_637, __ret_637, 1, 0); \ 56523 __ret_637; \ 56524 }) 56525 #endif 56526 56527 #ifdef __LITTLE_ENDIAN__ 56528 #define vqdmlal_laneq_s16(__p0_638, __p1_638, __p2_638, __p3_638) __extension__ ({ \ 56529 int32x4_t __ret_638; \ 56530 int32x4_t __s0_638 = __p0_638; \ 56531 int16x4_t __s1_638 = __p1_638; \ 56532 int16x8_t __s2_638 = __p2_638; \ 56533 __ret_638 = vqdmlal_s16(__s0_638, __s1_638, splat_laneq_s16(__s2_638, __p3_638)); \ 56534 __ret_638; \ 56535 }) 56536 #else 56537 #define vqdmlal_laneq_s16(__p0_639, __p1_639, __p2_639, __p3_639) __extension__ ({ \ 56538 int32x4_t __ret_639; \ 56539 int32x4_t __s0_639 = __p0_639; \ 56540 int16x4_t __s1_639 = __p1_639; \ 56541 int16x8_t __s2_639 = __p2_639; \ 56542 
int32x4_t __rev0_639; __rev0_639 = __builtin_shufflevector(__s0_639, __s0_639, 3, 2, 1, 0); \ 56543 int16x4_t __rev1_639; __rev1_639 = __builtin_shufflevector(__s1_639, __s1_639, 3, 2, 1, 0); \ 56544 int16x8_t __rev2_639; __rev2_639 = __builtin_shufflevector(__s2_639, __s2_639, 7, 6, 5, 4, 3, 2, 1, 0); \ 56545 __ret_639 = __noswap_vqdmlal_s16(__rev0_639, __rev1_639, __noswap_splat_laneq_s16(__rev2_639, __p3_639)); \ 56546 __ret_639 = __builtin_shufflevector(__ret_639, __ret_639, 3, 2, 1, 0); \ 56547 __ret_639; \ 56548 }) 56549 #endif 56550 56551 __ai __attribute__((target("neon"))) int64_t vqdmlsls_s32(int64_t __p0, int32_t __p1, int32_t __p2) { 56552 int64_t __ret; 56553 __ret = (int64_t) __builtin_neon_vqdmlsls_s32(__p0, __p1, __p2); 56554 return __ret; 56555 } 56556 __ai __attribute__((target("neon"))) int32_t vqdmlslh_s16(int32_t __p0, int16_t __p1, int16_t __p2) { 56557 int32_t __ret; 56558 __ret = (int32_t) __builtin_neon_vqdmlslh_s16(__p0, __p1, __p2); 56559 return __ret; 56560 } 56561 #ifdef __LITTLE_ENDIAN__ 56562 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 56563 int64x2_t __ret; 56564 __ret = vqdmlsl_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2)); 56565 return __ret; 56566 } 56567 #else 56568 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 56569 int64x2_t __ret; 56570 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56571 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 56572 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 56573 __ret = __noswap_vqdmlsl_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2)); 56574 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 56575 return __ret; 56576 } 56577 #endif 56578 56579 #ifdef __LITTLE_ENDIAN__ 56580 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_high_s16(int32x4_t 
__p0, int16x8_t __p1, int16x8_t __p2) { 56581 int32x4_t __ret; 56582 __ret = vqdmlsl_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2)); 56583 return __ret; 56584 } 56585 #else 56586 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 56587 int32x4_t __ret; 56588 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 56589 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 56590 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 56591 __ret = __noswap_vqdmlsl_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2)); 56592 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 56593 return __ret; 56594 } 56595 #endif 56596 56597 #ifdef __LITTLE_ENDIAN__ 56598 #define vqdmlsl_high_lane_s32(__p0_640, __p1_640, __p2_640, __p3_640) __extension__ ({ \ 56599 int64x2_t __ret_640; \ 56600 int64x2_t __s0_640 = __p0_640; \ 56601 int32x4_t __s1_640 = __p1_640; \ 56602 int32x2_t __s2_640 = __p2_640; \ 56603 __ret_640 = vqdmlsl_s32(__s0_640, vget_high_s32(__s1_640), splat_lane_s32(__s2_640, __p3_640)); \ 56604 __ret_640; \ 56605 }) 56606 #else 56607 #define vqdmlsl_high_lane_s32(__p0_641, __p1_641, __p2_641, __p3_641) __extension__ ({ \ 56608 int64x2_t __ret_641; \ 56609 int64x2_t __s0_641 = __p0_641; \ 56610 int32x4_t __s1_641 = __p1_641; \ 56611 int32x2_t __s2_641 = __p2_641; \ 56612 int64x2_t __rev0_641; __rev0_641 = __builtin_shufflevector(__s0_641, __s0_641, 1, 0); \ 56613 int32x4_t __rev1_641; __rev1_641 = __builtin_shufflevector(__s1_641, __s1_641, 3, 2, 1, 0); \ 56614 int32x2_t __rev2_641; __rev2_641 = __builtin_shufflevector(__s2_641, __s2_641, 1, 0); \ 56615 __ret_641 = __noswap_vqdmlsl_s32(__rev0_641, __noswap_vget_high_s32(__rev1_641), __noswap_splat_lane_s32(__rev2_641, __p3_641)); \ 56616 __ret_641 = __builtin_shufflevector(__ret_641, __ret_641, 1, 0); \ 56617 __ret_641; \ 56618 }) 56619 
#endif 56620 56621 #ifdef __LITTLE_ENDIAN__ 56622 #define vqdmlsl_high_lane_s16(__p0_642, __p1_642, __p2_642, __p3_642) __extension__ ({ \ 56623 int32x4_t __ret_642; \ 56624 int32x4_t __s0_642 = __p0_642; \ 56625 int16x8_t __s1_642 = __p1_642; \ 56626 int16x4_t __s2_642 = __p2_642; \ 56627 __ret_642 = vqdmlsl_s16(__s0_642, vget_high_s16(__s1_642), splat_lane_s16(__s2_642, __p3_642)); \ 56628 __ret_642; \ 56629 }) 56630 #else 56631 #define vqdmlsl_high_lane_s16(__p0_643, __p1_643, __p2_643, __p3_643) __extension__ ({ \ 56632 int32x4_t __ret_643; \ 56633 int32x4_t __s0_643 = __p0_643; \ 56634 int16x8_t __s1_643 = __p1_643; \ 56635 int16x4_t __s2_643 = __p2_643; \ 56636 int32x4_t __rev0_643; __rev0_643 = __builtin_shufflevector(__s0_643, __s0_643, 3, 2, 1, 0); \ 56637 int16x8_t __rev1_643; __rev1_643 = __builtin_shufflevector(__s1_643, __s1_643, 7, 6, 5, 4, 3, 2, 1, 0); \ 56638 int16x4_t __rev2_643; __rev2_643 = __builtin_shufflevector(__s2_643, __s2_643, 3, 2, 1, 0); \ 56639 __ret_643 = __noswap_vqdmlsl_s16(__rev0_643, __noswap_vget_high_s16(__rev1_643), __noswap_splat_lane_s16(__rev2_643, __p3_643)); \ 56640 __ret_643 = __builtin_shufflevector(__ret_643, __ret_643, 3, 2, 1, 0); \ 56641 __ret_643; \ 56642 }) 56643 #endif 56644 56645 #ifdef __LITTLE_ENDIAN__ 56646 #define vqdmlsl_high_laneq_s32(__p0_644, __p1_644, __p2_644, __p3_644) __extension__ ({ \ 56647 int64x2_t __ret_644; \ 56648 int64x2_t __s0_644 = __p0_644; \ 56649 int32x4_t __s1_644 = __p1_644; \ 56650 int32x4_t __s2_644 = __p2_644; \ 56651 __ret_644 = vqdmlsl_s32(__s0_644, vget_high_s32(__s1_644), splat_laneq_s32(__s2_644, __p3_644)); \ 56652 __ret_644; \ 56653 }) 56654 #else 56655 #define vqdmlsl_high_laneq_s32(__p0_645, __p1_645, __p2_645, __p3_645) __extension__ ({ \ 56656 int64x2_t __ret_645; \ 56657 int64x2_t __s0_645 = __p0_645; \ 56658 int32x4_t __s1_645 = __p1_645; \ 56659 int32x4_t __s2_645 = __p2_645; \ 56660 int64x2_t __rev0_645; __rev0_645 = __builtin_shufflevector(__s0_645, __s0_645, 1, 0); \ 
56661 int32x4_t __rev1_645; __rev1_645 = __builtin_shufflevector(__s1_645, __s1_645, 3, 2, 1, 0); \ 56662 int32x4_t __rev2_645; __rev2_645 = __builtin_shufflevector(__s2_645, __s2_645, 3, 2, 1, 0); \ 56663 __ret_645 = __noswap_vqdmlsl_s32(__rev0_645, __noswap_vget_high_s32(__rev1_645), __noswap_splat_laneq_s32(__rev2_645, __p3_645)); \ 56664 __ret_645 = __builtin_shufflevector(__ret_645, __ret_645, 1, 0); \ 56665 __ret_645; \ 56666 }) 56667 #endif 56668 56669 #ifdef __LITTLE_ENDIAN__ 56670 #define vqdmlsl_high_laneq_s16(__p0_646, __p1_646, __p2_646, __p3_646) __extension__ ({ \ 56671 int32x4_t __ret_646; \ 56672 int32x4_t __s0_646 = __p0_646; \ 56673 int16x8_t __s1_646 = __p1_646; \ 56674 int16x8_t __s2_646 = __p2_646; \ 56675 __ret_646 = vqdmlsl_s16(__s0_646, vget_high_s16(__s1_646), splat_laneq_s16(__s2_646, __p3_646)); \ 56676 __ret_646; \ 56677 }) 56678 #else 56679 #define vqdmlsl_high_laneq_s16(__p0_647, __p1_647, __p2_647, __p3_647) __extension__ ({ \ 56680 int32x4_t __ret_647; \ 56681 int32x4_t __s0_647 = __p0_647; \ 56682 int16x8_t __s1_647 = __p1_647; \ 56683 int16x8_t __s2_647 = __p2_647; \ 56684 int32x4_t __rev0_647; __rev0_647 = __builtin_shufflevector(__s0_647, __s0_647, 3, 2, 1, 0); \ 56685 int16x8_t __rev1_647; __rev1_647 = __builtin_shufflevector(__s1_647, __s1_647, 7, 6, 5, 4, 3, 2, 1, 0); \ 56686 int16x8_t __rev2_647; __rev2_647 = __builtin_shufflevector(__s2_647, __s2_647, 7, 6, 5, 4, 3, 2, 1, 0); \ 56687 __ret_647 = __noswap_vqdmlsl_s16(__rev0_647, __noswap_vget_high_s16(__rev1_647), __noswap_splat_laneq_s16(__rev2_647, __p3_647)); \ 56688 __ret_647 = __builtin_shufflevector(__ret_647, __ret_647, 3, 2, 1, 0); \ 56689 __ret_647; \ 56690 }) 56691 #endif 56692 56693 #ifdef __LITTLE_ENDIAN__ 56694 __ai __attribute__((target("neon"))) int64x2_t vqdmlsl_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) { 56695 int64x2_t __ret; 56696 __ret = vqdmlsl_n_s32(__p0, vget_high_s32(__p1), __p2); 56697 return __ret; 56698 } 56699 #else 56700 __ai 
__attribute__((target("neon"))) int64x2_t vqdmlsl_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) { 56701 int64x2_t __ret; 56702 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 56703 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 56704 __ret = __noswap_vqdmlsl_n_s32(__rev0, __noswap_vget_high_s32(__rev1), __p2); 56705 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 56706 return __ret; 56707 } 56708 #endif 56709 56710 #ifdef __LITTLE_ENDIAN__ 56711 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) { 56712 int32x4_t __ret; 56713 __ret = vqdmlsl_n_s16(__p0, vget_high_s16(__p1), __p2); 56714 return __ret; 56715 } 56716 #else 56717 __ai __attribute__((target("neon"))) int32x4_t vqdmlsl_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) { 56718 int32x4_t __ret; 56719 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 56720 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 56721 __ret = __noswap_vqdmlsl_n_s16(__rev0, __noswap_vget_high_s16(__rev1), __p2); 56722 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 56723 return __ret; 56724 } 56725 #endif 56726 56727 #ifdef __LITTLE_ENDIAN__ 56728 #define vqdmlsls_lane_s32(__p0, __p1, __p2, __p3) __extension__ ({ \ 56729 int64_t __ret; \ 56730 int64_t __s0 = __p0; \ 56731 int32_t __s1 = __p1; \ 56732 int32x2_t __s2 = __p2; \ 56733 __ret = (int64_t) __builtin_neon_vqdmlsls_lane_s32(__s0, __s1, __s2, __p3); \ 56734 __ret; \ 56735 }) 56736 #else 56737 #define vqdmlsls_lane_s32(__p0, __p1, __p2, __p3) __extension__ ({ \ 56738 int64_t __ret; \ 56739 int64_t __s0 = __p0; \ 56740 int32_t __s1 = __p1; \ 56741 int32x2_t __s2 = __p2; \ 56742 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 1, 0); \ 56743 __ret = (int64_t) __builtin_neon_vqdmlsls_lane_s32(__s0, __s1, __rev2, __p3); \ 56744 __ret; \ 56745 }) 56746 #endif 
56747 56748 #ifdef __LITTLE_ENDIAN__ 56749 #define vqdmlslh_lane_s16(__p0, __p1, __p2, __p3) __extension__ ({ \ 56750 int32_t __ret; \ 56751 int32_t __s0 = __p0; \ 56752 int16_t __s1 = __p1; \ 56753 int16x4_t __s2 = __p2; \ 56754 __ret = (int32_t) __builtin_neon_vqdmlslh_lane_s16(__s0, __s1, __s2, __p3); \ 56755 __ret; \ 56756 }) 56757 #else 56758 #define vqdmlslh_lane_s16(__p0, __p1, __p2, __p3) __extension__ ({ \ 56759 int32_t __ret; \ 56760 int32_t __s0 = __p0; \ 56761 int16_t __s1 = __p1; \ 56762 int16x4_t __s2 = __p2; \ 56763 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 56764 __ret = (int32_t) __builtin_neon_vqdmlslh_lane_s16(__s0, __s1, __rev2, __p3); \ 56765 __ret; \ 56766 }) 56767 #endif 56768 56769 #ifdef __LITTLE_ENDIAN__ 56770 #define vqdmlsls_laneq_s32(__p0, __p1, __p2, __p3) __extension__ ({ \ 56771 int64_t __ret; \ 56772 int64_t __s0 = __p0; \ 56773 int32_t __s1 = __p1; \ 56774 int32x4_t __s2 = __p2; \ 56775 __ret = (int64_t) __builtin_neon_vqdmlsls_laneq_s32(__s0, __s1, __s2, __p3); \ 56776 __ret; \ 56777 }) 56778 #else 56779 #define vqdmlsls_laneq_s32(__p0, __p1, __p2, __p3) __extension__ ({ \ 56780 int64_t __ret; \ 56781 int64_t __s0 = __p0; \ 56782 int32_t __s1 = __p1; \ 56783 int32x4_t __s2 = __p2; \ 56784 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 56785 __ret = (int64_t) __builtin_neon_vqdmlsls_laneq_s32(__s0, __s1, __rev2, __p3); \ 56786 __ret; \ 56787 }) 56788 #endif 56789 56790 #ifdef __LITTLE_ENDIAN__ 56791 #define vqdmlslh_laneq_s16(__p0, __p1, __p2, __p3) __extension__ ({ \ 56792 int32_t __ret; \ 56793 int32_t __s0 = __p0; \ 56794 int16_t __s1 = __p1; \ 56795 int16x8_t __s2 = __p2; \ 56796 __ret = (int32_t) __builtin_neon_vqdmlslh_laneq_s16(__s0, __s1, __s2, __p3); \ 56797 __ret; \ 56798 }) 56799 #else 56800 #define vqdmlslh_laneq_s16(__p0, __p1, __p2, __p3) __extension__ ({ \ 56801 int32_t __ret; \ 56802 int32_t __s0 = __p0; \ 56803 int16_t __s1 = __p1; \ 56804 int16x8_t 
__s2 = __p2; \ 56805 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 7, 6, 5, 4, 3, 2, 1, 0); \ 56806 __ret = (int32_t) __builtin_neon_vqdmlslh_laneq_s16(__s0, __s1, __rev2, __p3); \ 56807 __ret; \ 56808 }) 56809 #endif 56810 56811 #ifdef __LITTLE_ENDIAN__ 56812 #define vqdmlsl_laneq_s32(__p0_648, __p1_648, __p2_648, __p3_648) __extension__ ({ \ 56813 int64x2_t __ret_648; \ 56814 int64x2_t __s0_648 = __p0_648; \ 56815 int32x2_t __s1_648 = __p1_648; \ 56816 int32x4_t __s2_648 = __p2_648; \ 56817 __ret_648 = vqdmlsl_s32(__s0_648, __s1_648, splat_laneq_s32(__s2_648, __p3_648)); \ 56818 __ret_648; \ 56819 }) 56820 #else 56821 #define vqdmlsl_laneq_s32(__p0_649, __p1_649, __p2_649, __p3_649) __extension__ ({ \ 56822 int64x2_t __ret_649; \ 56823 int64x2_t __s0_649 = __p0_649; \ 56824 int32x2_t __s1_649 = __p1_649; \ 56825 int32x4_t __s2_649 = __p2_649; \ 56826 int64x2_t __rev0_649; __rev0_649 = __builtin_shufflevector(__s0_649, __s0_649, 1, 0); \ 56827 int32x2_t __rev1_649; __rev1_649 = __builtin_shufflevector(__s1_649, __s1_649, 1, 0); \ 56828 int32x4_t __rev2_649; __rev2_649 = __builtin_shufflevector(__s2_649, __s2_649, 3, 2, 1, 0); \ 56829 __ret_649 = __noswap_vqdmlsl_s32(__rev0_649, __rev1_649, __noswap_splat_laneq_s32(__rev2_649, __p3_649)); \ 56830 __ret_649 = __builtin_shufflevector(__ret_649, __ret_649, 1, 0); \ 56831 __ret_649; \ 56832 }) 56833 #endif 56834 56835 #ifdef __LITTLE_ENDIAN__ 56836 #define vqdmlsl_laneq_s16(__p0_650, __p1_650, __p2_650, __p3_650) __extension__ ({ \ 56837 int32x4_t __ret_650; \ 56838 int32x4_t __s0_650 = __p0_650; \ 56839 int16x4_t __s1_650 = __p1_650; \ 56840 int16x8_t __s2_650 = __p2_650; \ 56841 __ret_650 = vqdmlsl_s16(__s0_650, __s1_650, splat_laneq_s16(__s2_650, __p3_650)); \ 56842 __ret_650; \ 56843 }) 56844 #else 56845 #define vqdmlsl_laneq_s16(__p0_651, __p1_651, __p2_651, __p3_651) __extension__ ({ \ 56846 int32x4_t __ret_651; \ 56847 int32x4_t __s0_651 = __p0_651; \ 56848 int16x4_t __s1_651 = __p1_651; \ 56849 
int16x8_t __s2_651 = __p2_651; \ 56850 int32x4_t __rev0_651; __rev0_651 = __builtin_shufflevector(__s0_651, __s0_651, 3, 2, 1, 0); \ 56851 int16x4_t __rev1_651; __rev1_651 = __builtin_shufflevector(__s1_651, __s1_651, 3, 2, 1, 0); \ 56852 int16x8_t __rev2_651; __rev2_651 = __builtin_shufflevector(__s2_651, __s2_651, 7, 6, 5, 4, 3, 2, 1, 0); \ 56853 __ret_651 = __noswap_vqdmlsl_s16(__rev0_651, __rev1_651, __noswap_splat_laneq_s16(__rev2_651, __p3_651)); \ 56854 __ret_651 = __builtin_shufflevector(__ret_651, __ret_651, 3, 2, 1, 0); \ 56855 __ret_651; \ 56856 }) 56857 #endif 56858 56859 __ai __attribute__((target("neon"))) int32_t vqdmulhs_s32(int32_t __p0, int32_t __p1) { 56860 int32_t __ret; 56861 __ret = (int32_t) __builtin_neon_vqdmulhs_s32(__p0, __p1); 56862 return __ret; 56863 } 56864 __ai __attribute__((target("neon"))) int16_t vqdmulhh_s16(int16_t __p0, int16_t __p1) { 56865 int16_t __ret; 56866 __ret = (int16_t) __builtin_neon_vqdmulhh_s16(__p0, __p1); 56867 return __ret; 56868 } 56869 #ifdef __LITTLE_ENDIAN__ 56870 #define vqdmulhq_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 56871 int32x4_t __ret; \ 56872 int32x4_t __s0 = __p0; \ 56873 int32x2_t __s1 = __p1; \ 56874 __ret = (int32x4_t) __builtin_neon_vqdmulhq_lane_v((int8x16_t)__s0, (int8x8_t)__s1, __p2, 2); \ 56875 __ret; \ 56876 }) 56877 #else 56878 #define vqdmulhq_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 56879 int32x4_t __ret; \ 56880 int32x4_t __s0 = __p0; \ 56881 int32x2_t __s1 = __p1; \ 56882 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 56883 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 56884 __ret = (int32x4_t) __builtin_neon_vqdmulhq_lane_v((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 56885 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 56886 __ret; \ 56887 }) 56888 #endif 56889 56890 #ifdef __LITTLE_ENDIAN__ 56891 #define vqdmulhq_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 56892 int16x8_t __ret; \ 56893 
int16x8_t __s0 = __p0; \ 56894 int16x4_t __s1 = __p1; \ 56895 __ret = (int16x8_t) __builtin_neon_vqdmulhq_lane_v((int8x16_t)__s0, (int8x8_t)__s1, __p2, 1); \ 56896 __ret; \ 56897 }) 56898 #else 56899 #define vqdmulhq_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 56900 int16x8_t __ret; \ 56901 int16x8_t __s0 = __p0; \ 56902 int16x4_t __s1 = __p1; \ 56903 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 56904 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 56905 __ret = (int16x8_t) __builtin_neon_vqdmulhq_lane_v((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 56906 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 56907 __ret; \ 56908 }) 56909 #endif 56910 56911 #ifdef __LITTLE_ENDIAN__ 56912 #define vqdmulh_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 56913 int32x2_t __ret; \ 56914 int32x2_t __s0 = __p0; \ 56915 int32x2_t __s1 = __p1; \ 56916 __ret = (int32x2_t) __builtin_neon_vqdmulh_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \ 56917 __ret; \ 56918 }) 56919 #else 56920 #define vqdmulh_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 56921 int32x2_t __ret; \ 56922 int32x2_t __s0 = __p0; \ 56923 int32x2_t __s1 = __p1; \ 56924 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 56925 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 56926 __ret = (int32x2_t) __builtin_neon_vqdmulh_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 56927 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 56928 __ret; \ 56929 }) 56930 #endif 56931 56932 #ifdef __LITTLE_ENDIAN__ 56933 #define vqdmulh_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 56934 int16x4_t __ret; \ 56935 int16x4_t __s0 = __p0; \ 56936 int16x4_t __s1 = __p1; \ 56937 __ret = (int16x4_t) __builtin_neon_vqdmulh_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \ 56938 __ret; \ 56939 }) 56940 #else 56941 #define vqdmulh_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 56942 
int16x4_t __ret; \ 56943 int16x4_t __s0 = __p0; \ 56944 int16x4_t __s1 = __p1; \ 56945 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 56946 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 56947 __ret = (int16x4_t) __builtin_neon_vqdmulh_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 56948 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 56949 __ret; \ 56950 }) 56951 #endif 56952 56953 #ifdef __LITTLE_ENDIAN__ 56954 #define vqdmulhs_lane_s32(__p0_652, __p1_652, __p2_652) __extension__ ({ \ 56955 int32_t __ret_652; \ 56956 int32_t __s0_652 = __p0_652; \ 56957 int32x2_t __s1_652 = __p1_652; \ 56958 __ret_652 = vqdmulhs_s32(__s0_652, vget_lane_s32(__s1_652, __p2_652)); \ 56959 __ret_652; \ 56960 }) 56961 #else 56962 #define vqdmulhs_lane_s32(__p0_653, __p1_653, __p2_653) __extension__ ({ \ 56963 int32_t __ret_653; \ 56964 int32_t __s0_653 = __p0_653; \ 56965 int32x2_t __s1_653 = __p1_653; \ 56966 int32x2_t __rev1_653; __rev1_653 = __builtin_shufflevector(__s1_653, __s1_653, 1, 0); \ 56967 __ret_653 = vqdmulhs_s32(__s0_653, __noswap_vget_lane_s32(__rev1_653, __p2_653)); \ 56968 __ret_653; \ 56969 }) 56970 #endif 56971 56972 #ifdef __LITTLE_ENDIAN__ 56973 #define vqdmulhh_lane_s16(__p0_654, __p1_654, __p2_654) __extension__ ({ \ 56974 int16_t __ret_654; \ 56975 int16_t __s0_654 = __p0_654; \ 56976 int16x4_t __s1_654 = __p1_654; \ 56977 __ret_654 = vqdmulhh_s16(__s0_654, vget_lane_s16(__s1_654, __p2_654)); \ 56978 __ret_654; \ 56979 }) 56980 #else 56981 #define vqdmulhh_lane_s16(__p0_655, __p1_655, __p2_655) __extension__ ({ \ 56982 int16_t __ret_655; \ 56983 int16_t __s0_655 = __p0_655; \ 56984 int16x4_t __s1_655 = __p1_655; \ 56985 int16x4_t __rev1_655; __rev1_655 = __builtin_shufflevector(__s1_655, __s1_655, 3, 2, 1, 0); \ 56986 __ret_655 = vqdmulhh_s16(__s0_655, __noswap_vget_lane_s16(__rev1_655, __p2_655)); \ 56987 __ret_655; \ 56988 }) 56989 #endif 56990 56991 #ifdef __LITTLE_ENDIAN__ 
56992 #define vqdmulhs_laneq_s32(__p0_656, __p1_656, __p2_656) __extension__ ({ \ 56993 int32_t __ret_656; \ 56994 int32_t __s0_656 = __p0_656; \ 56995 int32x4_t __s1_656 = __p1_656; \ 56996 __ret_656 = vqdmulhs_s32(__s0_656, vgetq_lane_s32(__s1_656, __p2_656)); \ 56997 __ret_656; \ 56998 }) 56999 #else 57000 #define vqdmulhs_laneq_s32(__p0_657, __p1_657, __p2_657) __extension__ ({ \ 57001 int32_t __ret_657; \ 57002 int32_t __s0_657 = __p0_657; \ 57003 int32x4_t __s1_657 = __p1_657; \ 57004 int32x4_t __rev1_657; __rev1_657 = __builtin_shufflevector(__s1_657, __s1_657, 3, 2, 1, 0); \ 57005 __ret_657 = vqdmulhs_s32(__s0_657, __noswap_vgetq_lane_s32(__rev1_657, __p2_657)); \ 57006 __ret_657; \ 57007 }) 57008 #endif 57009 57010 #ifdef __LITTLE_ENDIAN__ 57011 #define vqdmulhh_laneq_s16(__p0_658, __p1_658, __p2_658) __extension__ ({ \ 57012 int16_t __ret_658; \ 57013 int16_t __s0_658 = __p0_658; \ 57014 int16x8_t __s1_658 = __p1_658; \ 57015 __ret_658 = vqdmulhh_s16(__s0_658, vgetq_lane_s16(__s1_658, __p2_658)); \ 57016 __ret_658; \ 57017 }) 57018 #else 57019 #define vqdmulhh_laneq_s16(__p0_659, __p1_659, __p2_659) __extension__ ({ \ 57020 int16_t __ret_659; \ 57021 int16_t __s0_659 = __p0_659; \ 57022 int16x8_t __s1_659 = __p1_659; \ 57023 int16x8_t __rev1_659; __rev1_659 = __builtin_shufflevector(__s1_659, __s1_659, 7, 6, 5, 4, 3, 2, 1, 0); \ 57024 __ret_659 = vqdmulhh_s16(__s0_659, __noswap_vgetq_lane_s16(__rev1_659, __p2_659)); \ 57025 __ret_659; \ 57026 }) 57027 #endif 57028 57029 #ifdef __LITTLE_ENDIAN__ 57030 #define vqdmulhq_laneq_s32(__p0, __p1, __p2) __extension__ ({ \ 57031 int32x4_t __ret; \ 57032 int32x4_t __s0 = __p0; \ 57033 int32x4_t __s1 = __p1; \ 57034 __ret = (int32x4_t) __builtin_neon_vqdmulhq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \ 57035 __ret; \ 57036 }) 57037 #else 57038 #define vqdmulhq_laneq_s32(__p0, __p1, __p2) __extension__ ({ \ 57039 int32x4_t __ret; \ 57040 int32x4_t __s0 = __p0; \ 57041 int32x4_t __s1 = __p1; \ 57042 
int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 57043 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 57044 __ret = (int32x4_t) __builtin_neon_vqdmulhq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \ 57045 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 57046 __ret; \ 57047 }) 57048 #endif 57049 57050 #ifdef __LITTLE_ENDIAN__ 57051 #define vqdmulhq_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 57052 int16x8_t __ret; \ 57053 int16x8_t __s0 = __p0; \ 57054 int16x8_t __s1 = __p1; \ 57055 __ret = (int16x8_t) __builtin_neon_vqdmulhq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \ 57056 __ret; \ 57057 }) 57058 #else 57059 #define vqdmulhq_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 57060 int16x8_t __ret; \ 57061 int16x8_t __s0 = __p0; \ 57062 int16x8_t __s1 = __p1; \ 57063 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 57064 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 57065 __ret = (int16x8_t) __builtin_neon_vqdmulhq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 57066 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 57067 __ret; \ 57068 }) 57069 #endif 57070 57071 #ifdef __LITTLE_ENDIAN__ 57072 #define vqdmulh_laneq_s32(__p0, __p1, __p2) __extension__ ({ \ 57073 int32x2_t __ret; \ 57074 int32x2_t __s0 = __p0; \ 57075 int32x4_t __s1 = __p1; \ 57076 __ret = (int32x2_t) __builtin_neon_vqdmulh_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 2); \ 57077 __ret; \ 57078 }) 57079 #else 57080 #define vqdmulh_laneq_s32(__p0, __p1, __p2) __extension__ ({ \ 57081 int32x2_t __ret; \ 57082 int32x2_t __s0 = __p0; \ 57083 int32x4_t __s1 = __p1; \ 57084 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 57085 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 57086 __ret = (int32x2_t) 
__builtin_neon_vqdmulh_laneq_v((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 2); \ 57087 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 57088 __ret; \ 57089 }) 57090 #endif 57091 57092 #ifdef __LITTLE_ENDIAN__ 57093 #define vqdmulh_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 57094 int16x4_t __ret; \ 57095 int16x4_t __s0 = __p0; \ 57096 int16x8_t __s1 = __p1; \ 57097 __ret = (int16x4_t) __builtin_neon_vqdmulh_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 1); \ 57098 __ret; \ 57099 }) 57100 #else 57101 #define vqdmulh_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 57102 int16x4_t __ret; \ 57103 int16x4_t __s0 = __p0; \ 57104 int16x8_t __s1 = __p1; \ 57105 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 57106 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 57107 __ret = (int16x4_t) __builtin_neon_vqdmulh_laneq_v((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 1); \ 57108 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 57109 __ret; \ 57110 }) 57111 #endif 57112 57113 __ai __attribute__((target("neon"))) int64_t vqdmulls_s32(int32_t __p0, int32_t __p1) { 57114 int64_t __ret; 57115 __ret = (int64_t) __builtin_neon_vqdmulls_s32(__p0, __p1); 57116 return __ret; 57117 } 57118 __ai __attribute__((target("neon"))) int32_t vqdmullh_s16(int16_t __p0, int16_t __p1) { 57119 int32_t __ret; 57120 __ret = (int32_t) __builtin_neon_vqdmullh_s16(__p0, __p1); 57121 return __ret; 57122 } 57123 #ifdef __LITTLE_ENDIAN__ 57124 __ai __attribute__((target("neon"))) int64x2_t vqdmull_high_s32(int32x4_t __p0, int32x4_t __p1) { 57125 int64x2_t __ret; 57126 __ret = vqdmull_s32(vget_high_s32(__p0), vget_high_s32(__p1)); 57127 return __ret; 57128 } 57129 #else 57130 __ai __attribute__((target("neon"))) int64x2_t vqdmull_high_s32(int32x4_t __p0, int32x4_t __p1) { 57131 int64x2_t __ret; 57132 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 57133 int32x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 57134 __ret = __noswap_vqdmull_s32(__noswap_vget_high_s32(__rev0), __noswap_vget_high_s32(__rev1)); 57135 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 57136 return __ret; 57137 } 57138 #endif 57139 57140 #ifdef __LITTLE_ENDIAN__ 57141 __ai __attribute__((target("neon"))) int32x4_t vqdmull_high_s16(int16x8_t __p0, int16x8_t __p1) { 57142 int32x4_t __ret; 57143 __ret = vqdmull_s16(vget_high_s16(__p0), vget_high_s16(__p1)); 57144 return __ret; 57145 } 57146 #else 57147 __ai __attribute__((target("neon"))) int32x4_t vqdmull_high_s16(int16x8_t __p0, int16x8_t __p1) { 57148 int32x4_t __ret; 57149 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 57150 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 57151 __ret = __noswap_vqdmull_s16(__noswap_vget_high_s16(__rev0), __noswap_vget_high_s16(__rev1)); 57152 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 57153 return __ret; 57154 } 57155 #endif 57156 57157 #ifdef __LITTLE_ENDIAN__ 57158 #define vqdmull_high_lane_s32(__p0_660, __p1_660, __p2_660) __extension__ ({ \ 57159 int64x2_t __ret_660; \ 57160 int32x4_t __s0_660 = __p0_660; \ 57161 int32x2_t __s1_660 = __p1_660; \ 57162 __ret_660 = vqdmull_s32(vget_high_s32(__s0_660), splat_lane_s32(__s1_660, __p2_660)); \ 57163 __ret_660; \ 57164 }) 57165 #else 57166 #define vqdmull_high_lane_s32(__p0_661, __p1_661, __p2_661) __extension__ ({ \ 57167 int64x2_t __ret_661; \ 57168 int32x4_t __s0_661 = __p0_661; \ 57169 int32x2_t __s1_661 = __p1_661; \ 57170 int32x4_t __rev0_661; __rev0_661 = __builtin_shufflevector(__s0_661, __s0_661, 3, 2, 1, 0); \ 57171 int32x2_t __rev1_661; __rev1_661 = __builtin_shufflevector(__s1_661, __s1_661, 1, 0); \ 57172 __ret_661 = __noswap_vqdmull_s32(__noswap_vget_high_s32(__rev0_661), __noswap_splat_lane_s32(__rev1_661, __p2_661)); \ 57173 __ret_661 = __builtin_shufflevector(__ret_661, __ret_661, 1, 0); \ 57174 
__ret_661; \ 57175 }) 57176 #endif 57177 57178 #ifdef __LITTLE_ENDIAN__ 57179 #define vqdmull_high_lane_s16(__p0_662, __p1_662, __p2_662) __extension__ ({ \ 57180 int32x4_t __ret_662; \ 57181 int16x8_t __s0_662 = __p0_662; \ 57182 int16x4_t __s1_662 = __p1_662; \ 57183 __ret_662 = vqdmull_s16(vget_high_s16(__s0_662), splat_lane_s16(__s1_662, __p2_662)); \ 57184 __ret_662; \ 57185 }) 57186 #else 57187 #define vqdmull_high_lane_s16(__p0_663, __p1_663, __p2_663) __extension__ ({ \ 57188 int32x4_t __ret_663; \ 57189 int16x8_t __s0_663 = __p0_663; \ 57190 int16x4_t __s1_663 = __p1_663; \ 57191 int16x8_t __rev0_663; __rev0_663 = __builtin_shufflevector(__s0_663, __s0_663, 7, 6, 5, 4, 3, 2, 1, 0); \ 57192 int16x4_t __rev1_663; __rev1_663 = __builtin_shufflevector(__s1_663, __s1_663, 3, 2, 1, 0); \ 57193 __ret_663 = __noswap_vqdmull_s16(__noswap_vget_high_s16(__rev0_663), __noswap_splat_lane_s16(__rev1_663, __p2_663)); \ 57194 __ret_663 = __builtin_shufflevector(__ret_663, __ret_663, 3, 2, 1, 0); \ 57195 __ret_663; \ 57196 }) 57197 #endif 57198 57199 #ifdef __LITTLE_ENDIAN__ 57200 #define vqdmull_high_laneq_s32(__p0_664, __p1_664, __p2_664) __extension__ ({ \ 57201 int64x2_t __ret_664; \ 57202 int32x4_t __s0_664 = __p0_664; \ 57203 int32x4_t __s1_664 = __p1_664; \ 57204 __ret_664 = vqdmull_s32(vget_high_s32(__s0_664), splat_laneq_s32(__s1_664, __p2_664)); \ 57205 __ret_664; \ 57206 }) 57207 #else 57208 #define vqdmull_high_laneq_s32(__p0_665, __p1_665, __p2_665) __extension__ ({ \ 57209 int64x2_t __ret_665; \ 57210 int32x4_t __s0_665 = __p0_665; \ 57211 int32x4_t __s1_665 = __p1_665; \ 57212 int32x4_t __rev0_665; __rev0_665 = __builtin_shufflevector(__s0_665, __s0_665, 3, 2, 1, 0); \ 57213 int32x4_t __rev1_665; __rev1_665 = __builtin_shufflevector(__s1_665, __s1_665, 3, 2, 1, 0); \ 57214 __ret_665 = __noswap_vqdmull_s32(__noswap_vget_high_s32(__rev0_665), __noswap_splat_laneq_s32(__rev1_665, __p2_665)); \ 57215 __ret_665 = __builtin_shufflevector(__ret_665, __ret_665, 1, 
0); \ 57216 __ret_665; \ 57217 }) 57218 #endif 57219 57220 #ifdef __LITTLE_ENDIAN__ 57221 #define vqdmull_high_laneq_s16(__p0_666, __p1_666, __p2_666) __extension__ ({ \ 57222 int32x4_t __ret_666; \ 57223 int16x8_t __s0_666 = __p0_666; \ 57224 int16x8_t __s1_666 = __p1_666; \ 57225 __ret_666 = vqdmull_s16(vget_high_s16(__s0_666), splat_laneq_s16(__s1_666, __p2_666)); \ 57226 __ret_666; \ 57227 }) 57228 #else 57229 #define vqdmull_high_laneq_s16(__p0_667, __p1_667, __p2_667) __extension__ ({ \ 57230 int32x4_t __ret_667; \ 57231 int16x8_t __s0_667 = __p0_667; \ 57232 int16x8_t __s1_667 = __p1_667; \ 57233 int16x8_t __rev0_667; __rev0_667 = __builtin_shufflevector(__s0_667, __s0_667, 7, 6, 5, 4, 3, 2, 1, 0); \ 57234 int16x8_t __rev1_667; __rev1_667 = __builtin_shufflevector(__s1_667, __s1_667, 7, 6, 5, 4, 3, 2, 1, 0); \ 57235 __ret_667 = __noswap_vqdmull_s16(__noswap_vget_high_s16(__rev0_667), __noswap_splat_laneq_s16(__rev1_667, __p2_667)); \ 57236 __ret_667 = __builtin_shufflevector(__ret_667, __ret_667, 3, 2, 1, 0); \ 57237 __ret_667; \ 57238 }) 57239 #endif 57240 57241 #ifdef __LITTLE_ENDIAN__ 57242 __ai __attribute__((target("neon"))) int64x2_t vqdmull_high_n_s32(int32x4_t __p0, int32_t __p1) { 57243 int64x2_t __ret; 57244 __ret = vqdmull_n_s32(vget_high_s32(__p0), __p1); 57245 return __ret; 57246 } 57247 #else 57248 __ai __attribute__((target("neon"))) int64x2_t vqdmull_high_n_s32(int32x4_t __p0, int32_t __p1) { 57249 int64x2_t __ret; 57250 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 57251 __ret = __noswap_vqdmull_n_s32(__noswap_vget_high_s32(__rev0), __p1); 57252 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 57253 return __ret; 57254 } 57255 #endif 57256 57257 #ifdef __LITTLE_ENDIAN__ 57258 __ai __attribute__((target("neon"))) int32x4_t vqdmull_high_n_s16(int16x8_t __p0, int16_t __p1) { 57259 int32x4_t __ret; 57260 __ret = vqdmull_n_s16(vget_high_s16(__p0), __p1); 57261 return __ret; 57262 } 57263 #else 57264 __ai 
__attribute__((target("neon"))) int32x4_t vqdmull_high_n_s16(int16x8_t __p0, int16_t __p1) { 57265 int32x4_t __ret; 57266 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 57267 __ret = __noswap_vqdmull_n_s16(__noswap_vget_high_s16(__rev0), __p1); 57268 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 57269 return __ret; 57270 } 57271 #endif 57272 57273 #ifdef __LITTLE_ENDIAN__ 57274 #define vqdmulls_lane_s32(__p0_668, __p1_668, __p2_668) __extension__ ({ \ 57275 int64_t __ret_668; \ 57276 int32_t __s0_668 = __p0_668; \ 57277 int32x2_t __s1_668 = __p1_668; \ 57278 __ret_668 = vqdmulls_s32(__s0_668, vget_lane_s32(__s1_668, __p2_668)); \ 57279 __ret_668; \ 57280 }) 57281 #else 57282 #define vqdmulls_lane_s32(__p0_669, __p1_669, __p2_669) __extension__ ({ \ 57283 int64_t __ret_669; \ 57284 int32_t __s0_669 = __p0_669; \ 57285 int32x2_t __s1_669 = __p1_669; \ 57286 int32x2_t __rev1_669; __rev1_669 = __builtin_shufflevector(__s1_669, __s1_669, 1, 0); \ 57287 __ret_669 = vqdmulls_s32(__s0_669, __noswap_vget_lane_s32(__rev1_669, __p2_669)); \ 57288 __ret_669; \ 57289 }) 57290 #endif 57291 57292 #ifdef __LITTLE_ENDIAN__ 57293 #define vqdmullh_lane_s16(__p0_670, __p1_670, __p2_670) __extension__ ({ \ 57294 int32_t __ret_670; \ 57295 int16_t __s0_670 = __p0_670; \ 57296 int16x4_t __s1_670 = __p1_670; \ 57297 __ret_670 = vqdmullh_s16(__s0_670, vget_lane_s16(__s1_670, __p2_670)); \ 57298 __ret_670; \ 57299 }) 57300 #else 57301 #define vqdmullh_lane_s16(__p0_671, __p1_671, __p2_671) __extension__ ({ \ 57302 int32_t __ret_671; \ 57303 int16_t __s0_671 = __p0_671; \ 57304 int16x4_t __s1_671 = __p1_671; \ 57305 int16x4_t __rev1_671; __rev1_671 = __builtin_shufflevector(__s1_671, __s1_671, 3, 2, 1, 0); \ 57306 __ret_671 = vqdmullh_s16(__s0_671, __noswap_vget_lane_s16(__rev1_671, __p2_671)); \ 57307 __ret_671; \ 57308 }) 57309 #endif 57310 57311 #ifdef __LITTLE_ENDIAN__ 57312 #define vqdmulls_laneq_s32(__p0_672, __p1_672, __p2_672) 
__extension__ ({ \ 57313 int64_t __ret_672; \ 57314 int32_t __s0_672 = __p0_672; \ 57315 int32x4_t __s1_672 = __p1_672; \ 57316 __ret_672 = vqdmulls_s32(__s0_672, vgetq_lane_s32(__s1_672, __p2_672)); \ 57317 __ret_672; \ 57318 }) 57319 #else 57320 #define vqdmulls_laneq_s32(__p0_673, __p1_673, __p2_673) __extension__ ({ \ 57321 int64_t __ret_673; \ 57322 int32_t __s0_673 = __p0_673; \ 57323 int32x4_t __s1_673 = __p1_673; \ 57324 int32x4_t __rev1_673; __rev1_673 = __builtin_shufflevector(__s1_673, __s1_673, 3, 2, 1, 0); \ 57325 __ret_673 = vqdmulls_s32(__s0_673, __noswap_vgetq_lane_s32(__rev1_673, __p2_673)); \ 57326 __ret_673; \ 57327 }) 57328 #endif 57329 57330 #ifdef __LITTLE_ENDIAN__ 57331 #define vqdmullh_laneq_s16(__p0_674, __p1_674, __p2_674) __extension__ ({ \ 57332 int32_t __ret_674; \ 57333 int16_t __s0_674 = __p0_674; \ 57334 int16x8_t __s1_674 = __p1_674; \ 57335 __ret_674 = vqdmullh_s16(__s0_674, vgetq_lane_s16(__s1_674, __p2_674)); \ 57336 __ret_674; \ 57337 }) 57338 #else 57339 #define vqdmullh_laneq_s16(__p0_675, __p1_675, __p2_675) __extension__ ({ \ 57340 int32_t __ret_675; \ 57341 int16_t __s0_675 = __p0_675; \ 57342 int16x8_t __s1_675 = __p1_675; \ 57343 int16x8_t __rev1_675; __rev1_675 = __builtin_shufflevector(__s1_675, __s1_675, 7, 6, 5, 4, 3, 2, 1, 0); \ 57344 __ret_675 = vqdmullh_s16(__s0_675, __noswap_vgetq_lane_s16(__rev1_675, __p2_675)); \ 57345 __ret_675; \ 57346 }) 57347 #endif 57348 57349 #ifdef __LITTLE_ENDIAN__ 57350 #define vqdmull_laneq_s32(__p0_676, __p1_676, __p2_676) __extension__ ({ \ 57351 int64x2_t __ret_676; \ 57352 int32x2_t __s0_676 = __p0_676; \ 57353 int32x4_t __s1_676 = __p1_676; \ 57354 __ret_676 = vqdmull_s32(__s0_676, splat_laneq_s32(__s1_676, __p2_676)); \ 57355 __ret_676; \ 57356 }) 57357 #else 57358 #define vqdmull_laneq_s32(__p0_677, __p1_677, __p2_677) __extension__ ({ \ 57359 int64x2_t __ret_677; \ 57360 int32x2_t __s0_677 = __p0_677; \ 57361 int32x4_t __s1_677 = __p1_677; \ 57362 int32x2_t __rev0_677; 
__rev0_677 = __builtin_shufflevector(__s0_677, __s0_677, 1, 0); \ 57363 int32x4_t __rev1_677; __rev1_677 = __builtin_shufflevector(__s1_677, __s1_677, 3, 2, 1, 0); \ 57364 __ret_677 = __noswap_vqdmull_s32(__rev0_677, __noswap_splat_laneq_s32(__rev1_677, __p2_677)); \ 57365 __ret_677 = __builtin_shufflevector(__ret_677, __ret_677, 1, 0); \ 57366 __ret_677; \ 57367 }) 57368 #endif 57369 57370 #ifdef __LITTLE_ENDIAN__ 57371 #define vqdmull_laneq_s16(__p0_678, __p1_678, __p2_678) __extension__ ({ \ 57372 int32x4_t __ret_678; \ 57373 int16x4_t __s0_678 = __p0_678; \ 57374 int16x8_t __s1_678 = __p1_678; \ 57375 __ret_678 = vqdmull_s16(__s0_678, splat_laneq_s16(__s1_678, __p2_678)); \ 57376 __ret_678; \ 57377 }) 57378 #else 57379 #define vqdmull_laneq_s16(__p0_679, __p1_679, __p2_679) __extension__ ({ \ 57380 int32x4_t __ret_679; \ 57381 int16x4_t __s0_679 = __p0_679; \ 57382 int16x8_t __s1_679 = __p1_679; \ 57383 int16x4_t __rev0_679; __rev0_679 = __builtin_shufflevector(__s0_679, __s0_679, 3, 2, 1, 0); \ 57384 int16x8_t __rev1_679; __rev1_679 = __builtin_shufflevector(__s1_679, __s1_679, 7, 6, 5, 4, 3, 2, 1, 0); \ 57385 __ret_679 = __noswap_vqdmull_s16(__rev0_679, __noswap_splat_laneq_s16(__rev1_679, __p2_679)); \ 57386 __ret_679 = __builtin_shufflevector(__ret_679, __ret_679, 3, 2, 1, 0); \ 57387 __ret_679; \ 57388 }) 57389 #endif 57390 57391 __ai __attribute__((target("neon"))) int16_t vqmovns_s32(int32_t __p0) { 57392 int16_t __ret; 57393 __ret = (int16_t) __builtin_neon_vqmovns_s32(__p0); 57394 return __ret; 57395 } 57396 __ai __attribute__((target("neon"))) int32_t vqmovnd_s64(int64_t __p0) { 57397 int32_t __ret; 57398 __ret = (int32_t) __builtin_neon_vqmovnd_s64(__p0); 57399 return __ret; 57400 } 57401 __ai __attribute__((target("neon"))) int8_t vqmovnh_s16(int16_t __p0) { 57402 int8_t __ret; 57403 __ret = (int8_t) __builtin_neon_vqmovnh_s16(__p0); 57404 return __ret; 57405 } 57406 __ai __attribute__((target("neon"))) uint16_t vqmovns_u32(uint32_t __p0) { 57407 
uint16_t __ret; 57408 __ret = (uint16_t) __builtin_neon_vqmovns_u32(__p0); 57409 return __ret; 57410 } 57411 __ai __attribute__((target("neon"))) uint32_t vqmovnd_u64(uint64_t __p0) { 57412 uint32_t __ret; 57413 __ret = (uint32_t) __builtin_neon_vqmovnd_u64(__p0); 57414 return __ret; 57415 } 57416 __ai __attribute__((target("neon"))) uint8_t vqmovnh_u16(uint16_t __p0) { 57417 uint8_t __ret; 57418 __ret = (uint8_t) __builtin_neon_vqmovnh_u16(__p0); 57419 return __ret; 57420 } 57421 #ifdef __LITTLE_ENDIAN__ 57422 __ai __attribute__((target("neon"))) uint16x8_t vqmovn_high_u32(uint16x4_t __p0, uint32x4_t __p1) { 57423 uint16x8_t __ret; 57424 __ret = vcombine_u16(__p0, vqmovn_u32(__p1)); 57425 return __ret; 57426 } 57427 #else 57428 __ai __attribute__((target("neon"))) uint16x8_t vqmovn_high_u32(uint16x4_t __p0, uint32x4_t __p1) { 57429 uint16x8_t __ret; 57430 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 57431 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 57432 __ret = __noswap_vcombine_u16(__rev0, __noswap_vqmovn_u32(__rev1)); 57433 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 57434 return __ret; 57435 } 57436 #endif 57437 57438 #ifdef __LITTLE_ENDIAN__ 57439 __ai __attribute__((target("neon"))) uint32x4_t vqmovn_high_u64(uint32x2_t __p0, uint64x2_t __p1) { 57440 uint32x4_t __ret; 57441 __ret = vcombine_u32(__p0, vqmovn_u64(__p1)); 57442 return __ret; 57443 } 57444 #else 57445 __ai __attribute__((target("neon"))) uint32x4_t vqmovn_high_u64(uint32x2_t __p0, uint64x2_t __p1) { 57446 uint32x4_t __ret; 57447 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 57448 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 57449 __ret = __noswap_vcombine_u32(__rev0, __noswap_vqmovn_u64(__rev1)); 57450 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 57451 return __ret; 57452 } 57453 #endif 57454 57455 #ifdef __LITTLE_ENDIAN__ 57456 __ai 
__attribute__((target("neon"))) uint8x16_t vqmovn_high_u16(uint8x8_t __p0, uint16x8_t __p1) { 57457 uint8x16_t __ret; 57458 __ret = vcombine_u8(__p0, vqmovn_u16(__p1)); 57459 return __ret; 57460 } 57461 #else 57462 __ai __attribute__((target("neon"))) uint8x16_t vqmovn_high_u16(uint8x8_t __p0, uint16x8_t __p1) { 57463 uint8x16_t __ret; 57464 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 57465 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 57466 __ret = __noswap_vcombine_u8(__rev0, __noswap_vqmovn_u16(__rev1)); 57467 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 57468 return __ret; 57469 } 57470 #endif 57471 57472 #ifdef __LITTLE_ENDIAN__ 57473 __ai __attribute__((target("neon"))) int16x8_t vqmovn_high_s32(int16x4_t __p0, int32x4_t __p1) { 57474 int16x8_t __ret; 57475 __ret = vcombine_s16(__p0, vqmovn_s32(__p1)); 57476 return __ret; 57477 } 57478 #else 57479 __ai __attribute__((target("neon"))) int16x8_t vqmovn_high_s32(int16x4_t __p0, int32x4_t __p1) { 57480 int16x8_t __ret; 57481 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 57482 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 57483 __ret = __noswap_vcombine_s16(__rev0, __noswap_vqmovn_s32(__rev1)); 57484 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 57485 return __ret; 57486 } 57487 #endif 57488 57489 #ifdef __LITTLE_ENDIAN__ 57490 __ai __attribute__((target("neon"))) int32x4_t vqmovn_high_s64(int32x2_t __p0, int64x2_t __p1) { 57491 int32x4_t __ret; 57492 __ret = vcombine_s32(__p0, vqmovn_s64(__p1)); 57493 return __ret; 57494 } 57495 #else 57496 __ai __attribute__((target("neon"))) int32x4_t vqmovn_high_s64(int32x2_t __p0, int64x2_t __p1) { 57497 int32x4_t __ret; 57498 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 57499 int64x2_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 1, 0); 57500 __ret = __noswap_vcombine_s32(__rev0, __noswap_vqmovn_s64(__rev1)); 57501 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 57502 return __ret; 57503 } 57504 #endif 57505 57506 #ifdef __LITTLE_ENDIAN__ 57507 __ai __attribute__((target("neon"))) int8x16_t vqmovn_high_s16(int8x8_t __p0, int16x8_t __p1) { 57508 int8x16_t __ret; 57509 __ret = vcombine_s8(__p0, vqmovn_s16(__p1)); 57510 return __ret; 57511 } 57512 #else 57513 __ai __attribute__((target("neon"))) int8x16_t vqmovn_high_s16(int8x8_t __p0, int16x8_t __p1) { 57514 int8x16_t __ret; 57515 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 57516 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 57517 __ret = __noswap_vcombine_s8(__rev0, __noswap_vqmovn_s16(__rev1)); 57518 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 57519 return __ret; 57520 } 57521 #endif 57522 57523 __ai __attribute__((target("neon"))) uint16_t vqmovuns_s32(int32_t __p0) { 57524 uint16_t __ret; 57525 __ret = (uint16_t) __builtin_neon_vqmovuns_s32(__p0); 57526 return __ret; 57527 } 57528 __ai __attribute__((target("neon"))) uint32_t vqmovund_s64(int64_t __p0) { 57529 uint32_t __ret; 57530 __ret = (uint32_t) __builtin_neon_vqmovund_s64(__p0); 57531 return __ret; 57532 } 57533 __ai __attribute__((target("neon"))) uint8_t vqmovunh_s16(int16_t __p0) { 57534 uint8_t __ret; 57535 __ret = (uint8_t) __builtin_neon_vqmovunh_s16(__p0); 57536 return __ret; 57537 } 57538 #ifdef __LITTLE_ENDIAN__ 57539 __ai __attribute__((target("neon"))) uint16x8_t vqmovun_high_s32(uint16x4_t __p0, int32x4_t __p1) { 57540 uint16x8_t __ret; 57541 __ret = vcombine_u16((uint16x4_t)(__p0), vqmovun_s32(__p1)); 57542 return __ret; 57543 } 57544 #else 57545 __ai __attribute__((target("neon"))) uint16x8_t vqmovun_high_s32(uint16x4_t __p0, int32x4_t __p1) { 57546 uint16x8_t __ret; 57547 uint16x4_t 
__rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 57548 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 57549 __ret = __noswap_vcombine_u16((uint16x4_t)(__rev0), __noswap_vqmovun_s32(__rev1)); 57550 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 57551 return __ret; 57552 } 57553 #endif 57554 57555 #ifdef __LITTLE_ENDIAN__ 57556 __ai __attribute__((target("neon"))) uint32x4_t vqmovun_high_s64(uint32x2_t __p0, int64x2_t __p1) { 57557 uint32x4_t __ret; 57558 __ret = vcombine_u32((uint32x2_t)(__p0), vqmovun_s64(__p1)); 57559 return __ret; 57560 } 57561 #else 57562 __ai __attribute__((target("neon"))) uint32x4_t vqmovun_high_s64(uint32x2_t __p0, int64x2_t __p1) { 57563 uint32x4_t __ret; 57564 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 57565 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 57566 __ret = __noswap_vcombine_u32((uint32x2_t)(__rev0), __noswap_vqmovun_s64(__rev1)); 57567 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 57568 return __ret; 57569 } 57570 #endif 57571 57572 #ifdef __LITTLE_ENDIAN__ 57573 __ai __attribute__((target("neon"))) uint8x16_t vqmovun_high_s16(uint8x8_t __p0, int16x8_t __p1) { 57574 uint8x16_t __ret; 57575 __ret = vcombine_u8((uint8x8_t)(__p0), vqmovun_s16(__p1)); 57576 return __ret; 57577 } 57578 #else 57579 __ai __attribute__((target("neon"))) uint8x16_t vqmovun_high_s16(uint8x8_t __p0, int16x8_t __p1) { 57580 uint8x16_t __ret; 57581 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 57582 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 57583 __ret = __noswap_vcombine_u8((uint8x8_t)(__rev0), __noswap_vqmovun_s16(__rev1)); 57584 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 57585 return __ret; 57586 } 57587 #endif 57588 57589 #ifdef __LITTLE_ENDIAN__ 57590 __ai 
__attribute__((target("neon"))) int64x2_t vqnegq_s64(int64x2_t __p0) { 57591 int64x2_t __ret; 57592 __ret = (int64x2_t) __builtin_neon_vqnegq_v((int8x16_t)__p0, 35); 57593 return __ret; 57594 } 57595 #else 57596 __ai __attribute__((target("neon"))) int64x2_t vqnegq_s64(int64x2_t __p0) { 57597 int64x2_t __ret; 57598 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 57599 __ret = (int64x2_t) __builtin_neon_vqnegq_v((int8x16_t)__rev0, 35); 57600 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 57601 return __ret; 57602 } 57603 #endif 57604 57605 __ai __attribute__((target("neon"))) int64x1_t vqneg_s64(int64x1_t __p0) { 57606 int64x1_t __ret; 57607 __ret = (int64x1_t) __builtin_neon_vqneg_v((int8x8_t)__p0, 3); 57608 return __ret; 57609 } 57610 __ai __attribute__((target("neon"))) int8_t vqnegb_s8(int8_t __p0) { 57611 int8_t __ret; 57612 __ret = (int8_t) __builtin_neon_vqnegb_s8(__p0); 57613 return __ret; 57614 } 57615 __ai __attribute__((target("neon"))) int32_t vqnegs_s32(int32_t __p0) { 57616 int32_t __ret; 57617 __ret = (int32_t) __builtin_neon_vqnegs_s32(__p0); 57618 return __ret; 57619 } 57620 __ai __attribute__((target("neon"))) int64_t vqnegd_s64(int64_t __p0) { 57621 int64_t __ret; 57622 __ret = (int64_t) __builtin_neon_vqnegd_s64(__p0); 57623 return __ret; 57624 } 57625 __ai __attribute__((target("neon"))) int16_t vqnegh_s16(int16_t __p0) { 57626 int16_t __ret; 57627 __ret = (int16_t) __builtin_neon_vqnegh_s16(__p0); 57628 return __ret; 57629 } 57630 __ai __attribute__((target("neon"))) int32_t vqrdmulhs_s32(int32_t __p0, int32_t __p1) { 57631 int32_t __ret; 57632 __ret = (int32_t) __builtin_neon_vqrdmulhs_s32(__p0, __p1); 57633 return __ret; 57634 } 57635 __ai __attribute__((target("neon"))) int16_t vqrdmulhh_s16(int16_t __p0, int16_t __p1) { 57636 int16_t __ret; 57637 __ret = (int16_t) __builtin_neon_vqrdmulhh_s16(__p0, __p1); 57638 return __ret; 57639 } 57640 #ifdef __LITTLE_ENDIAN__ 57641 #define vqrdmulhq_lane_s32(__p0, __p1, __p2) 
__extension__ ({ \ 57642 int32x4_t __ret; \ 57643 int32x4_t __s0 = __p0; \ 57644 int32x2_t __s1 = __p1; \ 57645 __ret = (int32x4_t) __builtin_neon_vqrdmulhq_lane_v((int8x16_t)__s0, (int8x8_t)__s1, __p2, 2); \ 57646 __ret; \ 57647 }) 57648 #else 57649 #define vqrdmulhq_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 57650 int32x4_t __ret; \ 57651 int32x4_t __s0 = __p0; \ 57652 int32x2_t __s1 = __p1; \ 57653 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 57654 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 57655 __ret = (int32x4_t) __builtin_neon_vqrdmulhq_lane_v((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 57656 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 57657 __ret; \ 57658 }) 57659 #endif 57660 57661 #ifdef __LITTLE_ENDIAN__ 57662 #define vqrdmulhq_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 57663 int16x8_t __ret; \ 57664 int16x8_t __s0 = __p0; \ 57665 int16x4_t __s1 = __p1; \ 57666 __ret = (int16x8_t) __builtin_neon_vqrdmulhq_lane_v((int8x16_t)__s0, (int8x8_t)__s1, __p2, 1); \ 57667 __ret; \ 57668 }) 57669 #else 57670 #define vqrdmulhq_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 57671 int16x8_t __ret; \ 57672 int16x8_t __s0 = __p0; \ 57673 int16x4_t __s1 = __p1; \ 57674 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 57675 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 57676 __ret = (int16x8_t) __builtin_neon_vqrdmulhq_lane_v((int8x16_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 57677 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 57678 __ret; \ 57679 }) 57680 #endif 57681 57682 #ifdef __LITTLE_ENDIAN__ 57683 #define vqrdmulh_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 57684 int32x2_t __ret; \ 57685 int32x2_t __s0 = __p0; \ 57686 int32x2_t __s1 = __p1; \ 57687 __ret = (int32x2_t) __builtin_neon_vqrdmulh_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 2); \ 57688 __ret; \ 57689 }) 57690 #else 
57691 #define vqrdmulh_lane_s32(__p0, __p1, __p2) __extension__ ({ \ 57692 int32x2_t __ret; \ 57693 int32x2_t __s0 = __p0; \ 57694 int32x2_t __s1 = __p1; \ 57695 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 57696 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 57697 __ret = (int32x2_t) __builtin_neon_vqrdmulh_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 2); \ 57698 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 57699 __ret; \ 57700 }) 57701 #endif 57702 57703 #ifdef __LITTLE_ENDIAN__ 57704 #define vqrdmulh_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 57705 int16x4_t __ret; \ 57706 int16x4_t __s0 = __p0; \ 57707 int16x4_t __s1 = __p1; \ 57708 __ret = (int16x4_t) __builtin_neon_vqrdmulh_lane_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 1); \ 57709 __ret; \ 57710 }) 57711 #else 57712 #define vqrdmulh_lane_s16(__p0, __p1, __p2) __extension__ ({ \ 57713 int16x4_t __ret; \ 57714 int16x4_t __s0 = __p0; \ 57715 int16x4_t __s1 = __p1; \ 57716 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 57717 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 57718 __ret = (int16x4_t) __builtin_neon_vqrdmulh_lane_v((int8x8_t)__rev0, (int8x8_t)__rev1, __p2, 1); \ 57719 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 57720 __ret; \ 57721 }) 57722 #endif 57723 57724 #ifdef __LITTLE_ENDIAN__ 57725 #define vqrdmulhs_lane_s32(__p0_680, __p1_680, __p2_680) __extension__ ({ \ 57726 int32_t __ret_680; \ 57727 int32_t __s0_680 = __p0_680; \ 57728 int32x2_t __s1_680 = __p1_680; \ 57729 __ret_680 = vqrdmulhs_s32(__s0_680, vget_lane_s32(__s1_680, __p2_680)); \ 57730 __ret_680; \ 57731 }) 57732 #else 57733 #define vqrdmulhs_lane_s32(__p0_681, __p1_681, __p2_681) __extension__ ({ \ 57734 int32_t __ret_681; \ 57735 int32_t __s0_681 = __p0_681; \ 57736 int32x2_t __s1_681 = __p1_681; \ 57737 int32x2_t __rev1_681; __rev1_681 = __builtin_shufflevector(__s1_681, __s1_681, 1, 0); \ 
57738 __ret_681 = vqrdmulhs_s32(__s0_681, __noswap_vget_lane_s32(__rev1_681, __p2_681)); \ 57739 __ret_681; \ 57740 }) 57741 #endif 57742 57743 #ifdef __LITTLE_ENDIAN__ 57744 #define vqrdmulhh_lane_s16(__p0_682, __p1_682, __p2_682) __extension__ ({ \ 57745 int16_t __ret_682; \ 57746 int16_t __s0_682 = __p0_682; \ 57747 int16x4_t __s1_682 = __p1_682; \ 57748 __ret_682 = vqrdmulhh_s16(__s0_682, vget_lane_s16(__s1_682, __p2_682)); \ 57749 __ret_682; \ 57750 }) 57751 #else 57752 #define vqrdmulhh_lane_s16(__p0_683, __p1_683, __p2_683) __extension__ ({ \ 57753 int16_t __ret_683; \ 57754 int16_t __s0_683 = __p0_683; \ 57755 int16x4_t __s1_683 = __p1_683; \ 57756 int16x4_t __rev1_683; __rev1_683 = __builtin_shufflevector(__s1_683, __s1_683, 3, 2, 1, 0); \ 57757 __ret_683 = vqrdmulhh_s16(__s0_683, __noswap_vget_lane_s16(__rev1_683, __p2_683)); \ 57758 __ret_683; \ 57759 }) 57760 #endif 57761 57762 #ifdef __LITTLE_ENDIAN__ 57763 #define vqrdmulhs_laneq_s32(__p0_684, __p1_684, __p2_684) __extension__ ({ \ 57764 int32_t __ret_684; \ 57765 int32_t __s0_684 = __p0_684; \ 57766 int32x4_t __s1_684 = __p1_684; \ 57767 __ret_684 = vqrdmulhs_s32(__s0_684, vgetq_lane_s32(__s1_684, __p2_684)); \ 57768 __ret_684; \ 57769 }) 57770 #else 57771 #define vqrdmulhs_laneq_s32(__p0_685, __p1_685, __p2_685) __extension__ ({ \ 57772 int32_t __ret_685; \ 57773 int32_t __s0_685 = __p0_685; \ 57774 int32x4_t __s1_685 = __p1_685; \ 57775 int32x4_t __rev1_685; __rev1_685 = __builtin_shufflevector(__s1_685, __s1_685, 3, 2, 1, 0); \ 57776 __ret_685 = vqrdmulhs_s32(__s0_685, __noswap_vgetq_lane_s32(__rev1_685, __p2_685)); \ 57777 __ret_685; \ 57778 }) 57779 #endif 57780 57781 #ifdef __LITTLE_ENDIAN__ 57782 #define vqrdmulhh_laneq_s16(__p0_686, __p1_686, __p2_686) __extension__ ({ \ 57783 int16_t __ret_686; \ 57784 int16_t __s0_686 = __p0_686; \ 57785 int16x8_t __s1_686 = __p1_686; \ 57786 __ret_686 = vqrdmulhh_s16(__s0_686, vgetq_lane_s16(__s1_686, __p2_686)); \ 57787 __ret_686; \ 57788 }) 57789 #else 
57790 #define vqrdmulhh_laneq_s16(__p0_687, __p1_687, __p2_687) __extension__ ({ \ 57791 int16_t __ret_687; \ 57792 int16_t __s0_687 = __p0_687; \ 57793 int16x8_t __s1_687 = __p1_687; \ 57794 int16x8_t __rev1_687; __rev1_687 = __builtin_shufflevector(__s1_687, __s1_687, 7, 6, 5, 4, 3, 2, 1, 0); \ 57795 __ret_687 = vqrdmulhh_s16(__s0_687, __noswap_vgetq_lane_s16(__rev1_687, __p2_687)); \ 57796 __ret_687; \ 57797 }) 57798 #endif 57799 57800 #ifdef __LITTLE_ENDIAN__ 57801 #define vqrdmulhq_laneq_s32(__p0, __p1, __p2) __extension__ ({ \ 57802 int32x4_t __ret; \ 57803 int32x4_t __s0 = __p0; \ 57804 int32x4_t __s1 = __p1; \ 57805 __ret = (int32x4_t) __builtin_neon_vqrdmulhq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 34); \ 57806 __ret; \ 57807 }) 57808 #else 57809 #define vqrdmulhq_laneq_s32(__p0, __p1, __p2) __extension__ ({ \ 57810 int32x4_t __ret; \ 57811 int32x4_t __s0 = __p0; \ 57812 int32x4_t __s1 = __p1; \ 57813 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 57814 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 57815 __ret = (int32x4_t) __builtin_neon_vqrdmulhq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 34); \ 57816 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 57817 __ret; \ 57818 }) 57819 #endif 57820 57821 #ifdef __LITTLE_ENDIAN__ 57822 #define vqrdmulhq_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 57823 int16x8_t __ret; \ 57824 int16x8_t __s0 = __p0; \ 57825 int16x8_t __s1 = __p1; \ 57826 __ret = (int16x8_t) __builtin_neon_vqrdmulhq_laneq_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 33); \ 57827 __ret; \ 57828 }) 57829 #else 57830 #define vqrdmulhq_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 57831 int16x8_t __ret; \ 57832 int16x8_t __s0 = __p0; \ 57833 int16x8_t __s1 = __p1; \ 57834 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 7, 6, 5, 4, 3, 2, 1, 0); \ 57835 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 
57836 __ret = (int16x8_t) __builtin_neon_vqrdmulhq_laneq_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 33); \ 57837 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); \ 57838 __ret; \ 57839 }) 57840 #endif 57841 57842 #ifdef __LITTLE_ENDIAN__ 57843 #define vqrdmulh_laneq_s32(__p0, __p1, __p2) __extension__ ({ \ 57844 int32x2_t __ret; \ 57845 int32x2_t __s0 = __p0; \ 57846 int32x4_t __s1 = __p1; \ 57847 __ret = (int32x2_t) __builtin_neon_vqrdmulh_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 2); \ 57848 __ret; \ 57849 }) 57850 #else 57851 #define vqrdmulh_laneq_s32(__p0, __p1, __p2) __extension__ ({ \ 57852 int32x2_t __ret; \ 57853 int32x2_t __s0 = __p0; \ 57854 int32x4_t __s1 = __p1; \ 57855 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 57856 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 57857 __ret = (int32x2_t) __builtin_neon_vqrdmulh_laneq_v((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 2); \ 57858 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 57859 __ret; \ 57860 }) 57861 #endif 57862 57863 #ifdef __LITTLE_ENDIAN__ 57864 #define vqrdmulh_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 57865 int16x4_t __ret; \ 57866 int16x4_t __s0 = __p0; \ 57867 int16x8_t __s1 = __p1; \ 57868 __ret = (int16x4_t) __builtin_neon_vqrdmulh_laneq_v((int8x8_t)__s0, (int8x16_t)__s1, __p2, 1); \ 57869 __ret; \ 57870 }) 57871 #else 57872 #define vqrdmulh_laneq_s16(__p0, __p1, __p2) __extension__ ({ \ 57873 int16x4_t __ret; \ 57874 int16x4_t __s0 = __p0; \ 57875 int16x8_t __s1 = __p1; \ 57876 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 57877 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 7, 6, 5, 4, 3, 2, 1, 0); \ 57878 __ret = (int16x4_t) __builtin_neon_vqrdmulh_laneq_v((int8x8_t)__rev0, (int8x16_t)__rev1, __p2, 1); \ 57879 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 57880 __ret; \ 57881 }) 57882 #endif 57883 57884 __ai 
__attribute__((target("neon"))) uint8_t vqrshlb_u8(uint8_t __p0, int8_t __p1) { 57885 uint8_t __ret; 57886 __ret = (uint8_t) __builtin_neon_vqrshlb_u8(__p0, __p1); 57887 return __ret; 57888 } 57889 __ai __attribute__((target("neon"))) uint32_t vqrshls_u32(uint32_t __p0, int32_t __p1) { 57890 uint32_t __ret; 57891 __ret = (uint32_t) __builtin_neon_vqrshls_u32(__p0, __p1); 57892 return __ret; 57893 } 57894 __ai __attribute__((target("neon"))) uint64_t vqrshld_u64(uint64_t __p0, int64_t __p1) { 57895 uint64_t __ret; 57896 __ret = (uint64_t) __builtin_neon_vqrshld_u64(__p0, __p1); 57897 return __ret; 57898 } 57899 __ai __attribute__((target("neon"))) uint16_t vqrshlh_u16(uint16_t __p0, int16_t __p1) { 57900 uint16_t __ret; 57901 __ret = (uint16_t) __builtin_neon_vqrshlh_u16(__p0, __p1); 57902 return __ret; 57903 } 57904 __ai __attribute__((target("neon"))) int8_t vqrshlb_s8(int8_t __p0, int8_t __p1) { 57905 int8_t __ret; 57906 __ret = (int8_t) __builtin_neon_vqrshlb_s8(__p0, __p1); 57907 return __ret; 57908 } 57909 __ai __attribute__((target("neon"))) int32_t vqrshls_s32(int32_t __p0, int32_t __p1) { 57910 int32_t __ret; 57911 __ret = (int32_t) __builtin_neon_vqrshls_s32(__p0, __p1); 57912 return __ret; 57913 } 57914 __ai __attribute__((target("neon"))) int64_t vqrshld_s64(int64_t __p0, int64_t __p1) { 57915 int64_t __ret; 57916 __ret = (int64_t) __builtin_neon_vqrshld_s64(__p0, __p1); 57917 return __ret; 57918 } 57919 __ai __attribute__((target("neon"))) int16_t vqrshlh_s16(int16_t __p0, int16_t __p1) { 57920 int16_t __ret; 57921 __ret = (int16_t) __builtin_neon_vqrshlh_s16(__p0, __p1); 57922 return __ret; 57923 } 57924 #ifdef __LITTLE_ENDIAN__ 57925 #define vqrshrn_high_n_u32(__p0_688, __p1_688, __p2_688) __extension__ ({ \ 57926 uint16x8_t __ret_688; \ 57927 uint16x4_t __s0_688 = __p0_688; \ 57928 uint32x4_t __s1_688 = __p1_688; \ 57929 __ret_688 = (uint16x8_t)(vcombine_u16((uint16x4_t)(__s0_688), (uint16x4_t)(vqrshrn_n_u32(__s1_688, __p2_688)))); \ 57930 __ret_688; 
\ 57931 }) 57932 #else 57933 #define vqrshrn_high_n_u32(__p0_689, __p1_689, __p2_689) __extension__ ({ \ 57934 uint16x8_t __ret_689; \ 57935 uint16x4_t __s0_689 = __p0_689; \ 57936 uint32x4_t __s1_689 = __p1_689; \ 57937 uint16x4_t __rev0_689; __rev0_689 = __builtin_shufflevector(__s0_689, __s0_689, 3, 2, 1, 0); \ 57938 uint32x4_t __rev1_689; __rev1_689 = __builtin_shufflevector(__s1_689, __s1_689, 3, 2, 1, 0); \ 57939 __ret_689 = (uint16x8_t)(__noswap_vcombine_u16((uint16x4_t)(__rev0_689), (uint16x4_t)(__noswap_vqrshrn_n_u32(__rev1_689, __p2_689)))); \ 57940 __ret_689 = __builtin_shufflevector(__ret_689, __ret_689, 7, 6, 5, 4, 3, 2, 1, 0); \ 57941 __ret_689; \ 57942 }) 57943 #endif 57944 57945 #ifdef __LITTLE_ENDIAN__ 57946 #define vqrshrn_high_n_u64(__p0_690, __p1_690, __p2_690) __extension__ ({ \ 57947 uint32x4_t __ret_690; \ 57948 uint32x2_t __s0_690 = __p0_690; \ 57949 uint64x2_t __s1_690 = __p1_690; \ 57950 __ret_690 = (uint32x4_t)(vcombine_u32((uint32x2_t)(__s0_690), (uint32x2_t)(vqrshrn_n_u64(__s1_690, __p2_690)))); \ 57951 __ret_690; \ 57952 }) 57953 #else 57954 #define vqrshrn_high_n_u64(__p0_691, __p1_691, __p2_691) __extension__ ({ \ 57955 uint32x4_t __ret_691; \ 57956 uint32x2_t __s0_691 = __p0_691; \ 57957 uint64x2_t __s1_691 = __p1_691; \ 57958 uint32x2_t __rev0_691; __rev0_691 = __builtin_shufflevector(__s0_691, __s0_691, 1, 0); \ 57959 uint64x2_t __rev1_691; __rev1_691 = __builtin_shufflevector(__s1_691, __s1_691, 1, 0); \ 57960 __ret_691 = (uint32x4_t)(__noswap_vcombine_u32((uint32x2_t)(__rev0_691), (uint32x2_t)(__noswap_vqrshrn_n_u64(__rev1_691, __p2_691)))); \ 57961 __ret_691 = __builtin_shufflevector(__ret_691, __ret_691, 3, 2, 1, 0); \ 57962 __ret_691; \ 57963 }) 57964 #endif 57965 57966 #ifdef __LITTLE_ENDIAN__ 57967 #define vqrshrn_high_n_u16(__p0_692, __p1_692, __p2_692) __extension__ ({ \ 57968 uint8x16_t __ret_692; \ 57969 uint8x8_t __s0_692 = __p0_692; \ 57970 uint16x8_t __s1_692 = __p1_692; \ 57971 __ret_692 = 
(uint8x16_t)(vcombine_u8((uint8x8_t)(__s0_692), (uint8x8_t)(vqrshrn_n_u16(__s1_692, __p2_692)))); \ 57972 __ret_692; \ 57973 }) 57974 #else 57975 #define vqrshrn_high_n_u16(__p0_693, __p1_693, __p2_693) __extension__ ({ \ 57976 uint8x16_t __ret_693; \ 57977 uint8x8_t __s0_693 = __p0_693; \ 57978 uint16x8_t __s1_693 = __p1_693; \ 57979 uint8x8_t __rev0_693; __rev0_693 = __builtin_shufflevector(__s0_693, __s0_693, 7, 6, 5, 4, 3, 2, 1, 0); \ 57980 uint16x8_t __rev1_693; __rev1_693 = __builtin_shufflevector(__s1_693, __s1_693, 7, 6, 5, 4, 3, 2, 1, 0); \ 57981 __ret_693 = (uint8x16_t)(__noswap_vcombine_u8((uint8x8_t)(__rev0_693), (uint8x8_t)(__noswap_vqrshrn_n_u16(__rev1_693, __p2_693)))); \ 57982 __ret_693 = __builtin_shufflevector(__ret_693, __ret_693, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 57983 __ret_693; \ 57984 }) 57985 #endif 57986 57987 #ifdef __LITTLE_ENDIAN__ 57988 #define vqrshrn_high_n_s32(__p0_694, __p1_694, __p2_694) __extension__ ({ \ 57989 int16x8_t __ret_694; \ 57990 int16x4_t __s0_694 = __p0_694; \ 57991 int32x4_t __s1_694 = __p1_694; \ 57992 __ret_694 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_694), (int16x4_t)(vqrshrn_n_s32(__s1_694, __p2_694)))); \ 57993 __ret_694; \ 57994 }) 57995 #else 57996 #define vqrshrn_high_n_s32(__p0_695, __p1_695, __p2_695) __extension__ ({ \ 57997 int16x8_t __ret_695; \ 57998 int16x4_t __s0_695 = __p0_695; \ 57999 int32x4_t __s1_695 = __p1_695; \ 58000 int16x4_t __rev0_695; __rev0_695 = __builtin_shufflevector(__s0_695, __s0_695, 3, 2, 1, 0); \ 58001 int32x4_t __rev1_695; __rev1_695 = __builtin_shufflevector(__s1_695, __s1_695, 3, 2, 1, 0); \ 58002 __ret_695 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_695), (int16x4_t)(__noswap_vqrshrn_n_s32(__rev1_695, __p2_695)))); \ 58003 __ret_695 = __builtin_shufflevector(__ret_695, __ret_695, 7, 6, 5, 4, 3, 2, 1, 0); \ 58004 __ret_695; \ 58005 }) 58006 #endif 58007 58008 #ifdef __LITTLE_ENDIAN__ 58009 #define vqrshrn_high_n_s64(__p0_696, __p1_696, 
__p2_696) __extension__ ({ \ 58010 int32x4_t __ret_696; \ 58011 int32x2_t __s0_696 = __p0_696; \ 58012 int64x2_t __s1_696 = __p1_696; \ 58013 __ret_696 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_696), (int32x2_t)(vqrshrn_n_s64(__s1_696, __p2_696)))); \ 58014 __ret_696; \ 58015 }) 58016 #else 58017 #define vqrshrn_high_n_s64(__p0_697, __p1_697, __p2_697) __extension__ ({ \ 58018 int32x4_t __ret_697; \ 58019 int32x2_t __s0_697 = __p0_697; \ 58020 int64x2_t __s1_697 = __p1_697; \ 58021 int32x2_t __rev0_697; __rev0_697 = __builtin_shufflevector(__s0_697, __s0_697, 1, 0); \ 58022 int64x2_t __rev1_697; __rev1_697 = __builtin_shufflevector(__s1_697, __s1_697, 1, 0); \ 58023 __ret_697 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_697), (int32x2_t)(__noswap_vqrshrn_n_s64(__rev1_697, __p2_697)))); \ 58024 __ret_697 = __builtin_shufflevector(__ret_697, __ret_697, 3, 2, 1, 0); \ 58025 __ret_697; \ 58026 }) 58027 #endif 58028 58029 #ifdef __LITTLE_ENDIAN__ 58030 #define vqrshrn_high_n_s16(__p0_698, __p1_698, __p2_698) __extension__ ({ \ 58031 int8x16_t __ret_698; \ 58032 int8x8_t __s0_698 = __p0_698; \ 58033 int16x8_t __s1_698 = __p1_698; \ 58034 __ret_698 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_698), (int8x8_t)(vqrshrn_n_s16(__s1_698, __p2_698)))); \ 58035 __ret_698; \ 58036 }) 58037 #else 58038 #define vqrshrn_high_n_s16(__p0_699, __p1_699, __p2_699) __extension__ ({ \ 58039 int8x16_t __ret_699; \ 58040 int8x8_t __s0_699 = __p0_699; \ 58041 int16x8_t __s1_699 = __p1_699; \ 58042 int8x8_t __rev0_699; __rev0_699 = __builtin_shufflevector(__s0_699, __s0_699, 7, 6, 5, 4, 3, 2, 1, 0); \ 58043 int16x8_t __rev1_699; __rev1_699 = __builtin_shufflevector(__s1_699, __s1_699, 7, 6, 5, 4, 3, 2, 1, 0); \ 58044 __ret_699 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_699), (int8x8_t)(__noswap_vqrshrn_n_s16(__rev1_699, __p2_699)))); \ 58045 __ret_699 = __builtin_shufflevector(__ret_699, __ret_699, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 58046 __ret_699; \ 
58047 }) 58048 #endif 58049 58050 #define vqrshrns_n_u32(__p0, __p1) __extension__ ({ \ 58051 uint16_t __ret; \ 58052 uint32_t __s0 = __p0; \ 58053 __ret = (uint16_t) __builtin_neon_vqrshrns_n_u32(__s0, __p1); \ 58054 __ret; \ 58055 }) 58056 #define vqrshrnd_n_u64(__p0, __p1) __extension__ ({ \ 58057 uint32_t __ret; \ 58058 uint64_t __s0 = __p0; \ 58059 __ret = (uint32_t) __builtin_neon_vqrshrnd_n_u64(__s0, __p1); \ 58060 __ret; \ 58061 }) 58062 #define vqrshrnh_n_u16(__p0, __p1) __extension__ ({ \ 58063 uint8_t __ret; \ 58064 uint16_t __s0 = __p0; \ 58065 __ret = (uint8_t) __builtin_neon_vqrshrnh_n_u16(__s0, __p1); \ 58066 __ret; \ 58067 }) 58068 #define vqrshrns_n_s32(__p0, __p1) __extension__ ({ \ 58069 int16_t __ret; \ 58070 int32_t __s0 = __p0; \ 58071 __ret = (int16_t) __builtin_neon_vqrshrns_n_s32(__s0, __p1); \ 58072 __ret; \ 58073 }) 58074 #define vqrshrnd_n_s64(__p0, __p1) __extension__ ({ \ 58075 int32_t __ret; \ 58076 int64_t __s0 = __p0; \ 58077 __ret = (int32_t) __builtin_neon_vqrshrnd_n_s64(__s0, __p1); \ 58078 __ret; \ 58079 }) 58080 #define vqrshrnh_n_s16(__p0, __p1) __extension__ ({ \ 58081 int8_t __ret; \ 58082 int16_t __s0 = __p0; \ 58083 __ret = (int8_t) __builtin_neon_vqrshrnh_n_s16(__s0, __p1); \ 58084 __ret; \ 58085 }) 58086 #ifdef __LITTLE_ENDIAN__ 58087 #define vqrshrun_high_n_s32(__p0_700, __p1_700, __p2_700) __extension__ ({ \ 58088 int16x8_t __ret_700; \ 58089 int16x4_t __s0_700 = __p0_700; \ 58090 int32x4_t __s1_700 = __p1_700; \ 58091 __ret_700 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_700), (int16x4_t)(vqrshrun_n_s32(__s1_700, __p2_700)))); \ 58092 __ret_700; \ 58093 }) 58094 #else 58095 #define vqrshrun_high_n_s32(__p0_701, __p1_701, __p2_701) __extension__ ({ \ 58096 int16x8_t __ret_701; \ 58097 int16x4_t __s0_701 = __p0_701; \ 58098 int32x4_t __s1_701 = __p1_701; \ 58099 int16x4_t __rev0_701; __rev0_701 = __builtin_shufflevector(__s0_701, __s0_701, 3, 2, 1, 0); \ 58100 int32x4_t __rev1_701; __rev1_701 = 
__builtin_shufflevector(__s1_701, __s1_701, 3, 2, 1, 0); \ 58101 __ret_701 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_701), (int16x4_t)(__noswap_vqrshrun_n_s32(__rev1_701, __p2_701)))); \ 58102 __ret_701 = __builtin_shufflevector(__ret_701, __ret_701, 7, 6, 5, 4, 3, 2, 1, 0); \ 58103 __ret_701; \ 58104 }) 58105 #endif 58106 58107 #ifdef __LITTLE_ENDIAN__ 58108 #define vqrshrun_high_n_s64(__p0_702, __p1_702, __p2_702) __extension__ ({ \ 58109 int32x4_t __ret_702; \ 58110 int32x2_t __s0_702 = __p0_702; \ 58111 int64x2_t __s1_702 = __p1_702; \ 58112 __ret_702 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_702), (int32x2_t)(vqrshrun_n_s64(__s1_702, __p2_702)))); \ 58113 __ret_702; \ 58114 }) 58115 #else 58116 #define vqrshrun_high_n_s64(__p0_703, __p1_703, __p2_703) __extension__ ({ \ 58117 int32x4_t __ret_703; \ 58118 int32x2_t __s0_703 = __p0_703; \ 58119 int64x2_t __s1_703 = __p1_703; \ 58120 int32x2_t __rev0_703; __rev0_703 = __builtin_shufflevector(__s0_703, __s0_703, 1, 0); \ 58121 int64x2_t __rev1_703; __rev1_703 = __builtin_shufflevector(__s1_703, __s1_703, 1, 0); \ 58122 __ret_703 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_703), (int32x2_t)(__noswap_vqrshrun_n_s64(__rev1_703, __p2_703)))); \ 58123 __ret_703 = __builtin_shufflevector(__ret_703, __ret_703, 3, 2, 1, 0); \ 58124 __ret_703; \ 58125 }) 58126 #endif 58127 58128 #ifdef __LITTLE_ENDIAN__ 58129 #define vqrshrun_high_n_s16(__p0_704, __p1_704, __p2_704) __extension__ ({ \ 58130 int8x16_t __ret_704; \ 58131 int8x8_t __s0_704 = __p0_704; \ 58132 int16x8_t __s1_704 = __p1_704; \ 58133 __ret_704 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_704), (int8x8_t)(vqrshrun_n_s16(__s1_704, __p2_704)))); \ 58134 __ret_704; \ 58135 }) 58136 #else 58137 #define vqrshrun_high_n_s16(__p0_705, __p1_705, __p2_705) __extension__ ({ \ 58138 int8x16_t __ret_705; \ 58139 int8x8_t __s0_705 = __p0_705; \ 58140 int16x8_t __s1_705 = __p1_705; \ 58141 int8x8_t __rev0_705; __rev0_705 = 
__builtin_shufflevector(__s0_705, __s0_705, 7, 6, 5, 4, 3, 2, 1, 0); \ 58142 int16x8_t __rev1_705; __rev1_705 = __builtin_shufflevector(__s1_705, __s1_705, 7, 6, 5, 4, 3, 2, 1, 0); \ 58143 __ret_705 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_705), (int8x8_t)(__noswap_vqrshrun_n_s16(__rev1_705, __p2_705)))); \ 58144 __ret_705 = __builtin_shufflevector(__ret_705, __ret_705, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 58145 __ret_705; \ 58146 }) 58147 #endif 58148 58149 #define vqrshruns_n_s32(__p0, __p1) __extension__ ({ \ 58150 uint16_t __ret; \ 58151 int32_t __s0 = __p0; \ 58152 __ret = (uint16_t) __builtin_neon_vqrshruns_n_s32(__s0, __p1); \ 58153 __ret; \ 58154 }) 58155 #define vqrshrund_n_s64(__p0, __p1) __extension__ ({ \ 58156 uint32_t __ret; \ 58157 int64_t __s0 = __p0; \ 58158 __ret = (uint32_t) __builtin_neon_vqrshrund_n_s64(__s0, __p1); \ 58159 __ret; \ 58160 }) 58161 #define vqrshrunh_n_s16(__p0, __p1) __extension__ ({ \ 58162 uint8_t __ret; \ 58163 int16_t __s0 = __p0; \ 58164 __ret = (uint8_t) __builtin_neon_vqrshrunh_n_s16(__s0, __p1); \ 58165 __ret; \ 58166 }) 58167 __ai __attribute__((target("neon"))) uint8_t vqshlb_u8(uint8_t __p0, int8_t __p1) { 58168 uint8_t __ret; 58169 __ret = (uint8_t) __builtin_neon_vqshlb_u8(__p0, __p1); 58170 return __ret; 58171 } 58172 __ai __attribute__((target("neon"))) uint32_t vqshls_u32(uint32_t __p0, int32_t __p1) { 58173 uint32_t __ret; 58174 __ret = (uint32_t) __builtin_neon_vqshls_u32(__p0, __p1); 58175 return __ret; 58176 } 58177 __ai __attribute__((target("neon"))) uint64_t vqshld_u64(uint64_t __p0, int64_t __p1) { 58178 uint64_t __ret; 58179 __ret = (uint64_t) __builtin_neon_vqshld_u64(__p0, __p1); 58180 return __ret; 58181 } 58182 __ai __attribute__((target("neon"))) uint16_t vqshlh_u16(uint16_t __p0, int16_t __p1) { 58183 uint16_t __ret; 58184 __ret = (uint16_t) __builtin_neon_vqshlh_u16(__p0, __p1); 58185 return __ret; 58186 } 58187 __ai __attribute__((target("neon"))) int8_t 
vqshlb_s8(int8_t __p0, int8_t __p1) { 58188 int8_t __ret; 58189 __ret = (int8_t) __builtin_neon_vqshlb_s8(__p0, __p1); 58190 return __ret; 58191 } 58192 __ai __attribute__((target("neon"))) int32_t vqshls_s32(int32_t __p0, int32_t __p1) { 58193 int32_t __ret; 58194 __ret = (int32_t) __builtin_neon_vqshls_s32(__p0, __p1); 58195 return __ret; 58196 } 58197 __ai __attribute__((target("neon"))) int64_t vqshld_s64(int64_t __p0, int64_t __p1) { 58198 int64_t __ret; 58199 __ret = (int64_t) __builtin_neon_vqshld_s64(__p0, __p1); 58200 return __ret; 58201 } 58202 __ai __attribute__((target("neon"))) int16_t vqshlh_s16(int16_t __p0, int16_t __p1) { 58203 int16_t __ret; 58204 __ret = (int16_t) __builtin_neon_vqshlh_s16(__p0, __p1); 58205 return __ret; 58206 } 58207 #define vqshlb_n_u8(__p0, __p1) __extension__ ({ \ 58208 uint8_t __ret; \ 58209 uint8_t __s0 = __p0; \ 58210 __ret = (uint8_t) __builtin_neon_vqshlb_n_u8(__s0, __p1); \ 58211 __ret; \ 58212 }) 58213 #define vqshls_n_u32(__p0, __p1) __extension__ ({ \ 58214 uint32_t __ret; \ 58215 uint32_t __s0 = __p0; \ 58216 __ret = (uint32_t) __builtin_neon_vqshls_n_u32(__s0, __p1); \ 58217 __ret; \ 58218 }) 58219 #define vqshld_n_u64(__p0, __p1) __extension__ ({ \ 58220 uint64_t __ret; \ 58221 uint64_t __s0 = __p0; \ 58222 __ret = (uint64_t) __builtin_neon_vqshld_n_u64(__s0, __p1); \ 58223 __ret; \ 58224 }) 58225 #define vqshlh_n_u16(__p0, __p1) __extension__ ({ \ 58226 uint16_t __ret; \ 58227 uint16_t __s0 = __p0; \ 58228 __ret = (uint16_t) __builtin_neon_vqshlh_n_u16(__s0, __p1); \ 58229 __ret; \ 58230 }) 58231 #define vqshlb_n_s8(__p0, __p1) __extension__ ({ \ 58232 int8_t __ret; \ 58233 int8_t __s0 = __p0; \ 58234 __ret = (int8_t) __builtin_neon_vqshlb_n_s8(__s0, __p1); \ 58235 __ret; \ 58236 }) 58237 #define vqshls_n_s32(__p0, __p1) __extension__ ({ \ 58238 int32_t __ret; \ 58239 int32_t __s0 = __p0; \ 58240 __ret = (int32_t) __builtin_neon_vqshls_n_s32(__s0, __p1); \ 58241 __ret; \ 58242 }) 58243 #define vqshld_n_s64(__p0, 
__p1) __extension__ ({ \ 58244 int64_t __ret; \ 58245 int64_t __s0 = __p0; \ 58246 __ret = (int64_t) __builtin_neon_vqshld_n_s64(__s0, __p1); \ 58247 __ret; \ 58248 }) 58249 #define vqshlh_n_s16(__p0, __p1) __extension__ ({ \ 58250 int16_t __ret; \ 58251 int16_t __s0 = __p0; \ 58252 __ret = (int16_t) __builtin_neon_vqshlh_n_s16(__s0, __p1); \ 58253 __ret; \ 58254 }) 58255 #define vqshlub_n_s8(__p0, __p1) __extension__ ({ \ 58256 int8_t __ret; \ 58257 int8_t __s0 = __p0; \ 58258 __ret = (int8_t) __builtin_neon_vqshlub_n_s8(__s0, __p1); \ 58259 __ret; \ 58260 }) 58261 #define vqshlus_n_s32(__p0, __p1) __extension__ ({ \ 58262 int32_t __ret; \ 58263 int32_t __s0 = __p0; \ 58264 __ret = (int32_t) __builtin_neon_vqshlus_n_s32(__s0, __p1); \ 58265 __ret; \ 58266 }) 58267 #define vqshlud_n_s64(__p0, __p1) __extension__ ({ \ 58268 int64_t __ret; \ 58269 int64_t __s0 = __p0; \ 58270 __ret = (int64_t) __builtin_neon_vqshlud_n_s64(__s0, __p1); \ 58271 __ret; \ 58272 }) 58273 #define vqshluh_n_s16(__p0, __p1) __extension__ ({ \ 58274 int16_t __ret; \ 58275 int16_t __s0 = __p0; \ 58276 __ret = (int16_t) __builtin_neon_vqshluh_n_s16(__s0, __p1); \ 58277 __ret; \ 58278 }) 58279 #ifdef __LITTLE_ENDIAN__ 58280 #define vqshrn_high_n_u32(__p0_706, __p1_706, __p2_706) __extension__ ({ \ 58281 uint16x8_t __ret_706; \ 58282 uint16x4_t __s0_706 = __p0_706; \ 58283 uint32x4_t __s1_706 = __p1_706; \ 58284 __ret_706 = (uint16x8_t)(vcombine_u16((uint16x4_t)(__s0_706), (uint16x4_t)(vqshrn_n_u32(__s1_706, __p2_706)))); \ 58285 __ret_706; \ 58286 }) 58287 #else 58288 #define vqshrn_high_n_u32(__p0_707, __p1_707, __p2_707) __extension__ ({ \ 58289 uint16x8_t __ret_707; \ 58290 uint16x4_t __s0_707 = __p0_707; \ 58291 uint32x4_t __s1_707 = __p1_707; \ 58292 uint16x4_t __rev0_707; __rev0_707 = __builtin_shufflevector(__s0_707, __s0_707, 3, 2, 1, 0); \ 58293 uint32x4_t __rev1_707; __rev1_707 = __builtin_shufflevector(__s1_707, __s1_707, 3, 2, 1, 0); \ 58294 __ret_707 = 
(uint16x8_t)(__noswap_vcombine_u16((uint16x4_t)(__rev0_707), (uint16x4_t)(__noswap_vqshrn_n_u32(__rev1_707, __p2_707)))); \ 58295 __ret_707 = __builtin_shufflevector(__ret_707, __ret_707, 7, 6, 5, 4, 3, 2, 1, 0); \ 58296 __ret_707; \ 58297 }) 58298 #endif 58299 58300 #ifdef __LITTLE_ENDIAN__ 58301 #define vqshrn_high_n_u64(__p0_708, __p1_708, __p2_708) __extension__ ({ \ 58302 uint32x4_t __ret_708; \ 58303 uint32x2_t __s0_708 = __p0_708; \ 58304 uint64x2_t __s1_708 = __p1_708; \ 58305 __ret_708 = (uint32x4_t)(vcombine_u32((uint32x2_t)(__s0_708), (uint32x2_t)(vqshrn_n_u64(__s1_708, __p2_708)))); \ 58306 __ret_708; \ 58307 }) 58308 #else 58309 #define vqshrn_high_n_u64(__p0_709, __p1_709, __p2_709) __extension__ ({ \ 58310 uint32x4_t __ret_709; \ 58311 uint32x2_t __s0_709 = __p0_709; \ 58312 uint64x2_t __s1_709 = __p1_709; \ 58313 uint32x2_t __rev0_709; __rev0_709 = __builtin_shufflevector(__s0_709, __s0_709, 1, 0); \ 58314 uint64x2_t __rev1_709; __rev1_709 = __builtin_shufflevector(__s1_709, __s1_709, 1, 0); \ 58315 __ret_709 = (uint32x4_t)(__noswap_vcombine_u32((uint32x2_t)(__rev0_709), (uint32x2_t)(__noswap_vqshrn_n_u64(__rev1_709, __p2_709)))); \ 58316 __ret_709 = __builtin_shufflevector(__ret_709, __ret_709, 3, 2, 1, 0); \ 58317 __ret_709; \ 58318 }) 58319 #endif 58320 58321 #ifdef __LITTLE_ENDIAN__ 58322 #define vqshrn_high_n_u16(__p0_710, __p1_710, __p2_710) __extension__ ({ \ 58323 uint8x16_t __ret_710; \ 58324 uint8x8_t __s0_710 = __p0_710; \ 58325 uint16x8_t __s1_710 = __p1_710; \ 58326 __ret_710 = (uint8x16_t)(vcombine_u8((uint8x8_t)(__s0_710), (uint8x8_t)(vqshrn_n_u16(__s1_710, __p2_710)))); \ 58327 __ret_710; \ 58328 }) 58329 #else 58330 #define vqshrn_high_n_u16(__p0_711, __p1_711, __p2_711) __extension__ ({ \ 58331 uint8x16_t __ret_711; \ 58332 uint8x8_t __s0_711 = __p0_711; \ 58333 uint16x8_t __s1_711 = __p1_711; \ 58334 uint8x8_t __rev0_711; __rev0_711 = __builtin_shufflevector(__s0_711, __s0_711, 7, 6, 5, 4, 3, 2, 1, 0); \ 58335 uint16x8_t 
__rev1_711; __rev1_711 = __builtin_shufflevector(__s1_711, __s1_711, 7, 6, 5, 4, 3, 2, 1, 0); \ 58336 __ret_711 = (uint8x16_t)(__noswap_vcombine_u8((uint8x8_t)(__rev0_711), (uint8x8_t)(__noswap_vqshrn_n_u16(__rev1_711, __p2_711)))); \ 58337 __ret_711 = __builtin_shufflevector(__ret_711, __ret_711, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 58338 __ret_711; \ 58339 }) 58340 #endif 58341 58342 #ifdef __LITTLE_ENDIAN__ 58343 #define vqshrn_high_n_s32(__p0_712, __p1_712, __p2_712) __extension__ ({ \ 58344 int16x8_t __ret_712; \ 58345 int16x4_t __s0_712 = __p0_712; \ 58346 int32x4_t __s1_712 = __p1_712; \ 58347 __ret_712 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_712), (int16x4_t)(vqshrn_n_s32(__s1_712, __p2_712)))); \ 58348 __ret_712; \ 58349 }) 58350 #else 58351 #define vqshrn_high_n_s32(__p0_713, __p1_713, __p2_713) __extension__ ({ \ 58352 int16x8_t __ret_713; \ 58353 int16x4_t __s0_713 = __p0_713; \ 58354 int32x4_t __s1_713 = __p1_713; \ 58355 int16x4_t __rev0_713; __rev0_713 = __builtin_shufflevector(__s0_713, __s0_713, 3, 2, 1, 0); \ 58356 int32x4_t __rev1_713; __rev1_713 = __builtin_shufflevector(__s1_713, __s1_713, 3, 2, 1, 0); \ 58357 __ret_713 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_713), (int16x4_t)(__noswap_vqshrn_n_s32(__rev1_713, __p2_713)))); \ 58358 __ret_713 = __builtin_shufflevector(__ret_713, __ret_713, 7, 6, 5, 4, 3, 2, 1, 0); \ 58359 __ret_713; \ 58360 }) 58361 #endif 58362 58363 #ifdef __LITTLE_ENDIAN__ 58364 #define vqshrn_high_n_s64(__p0_714, __p1_714, __p2_714) __extension__ ({ \ 58365 int32x4_t __ret_714; \ 58366 int32x2_t __s0_714 = __p0_714; \ 58367 int64x2_t __s1_714 = __p1_714; \ 58368 __ret_714 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_714), (int32x2_t)(vqshrn_n_s64(__s1_714, __p2_714)))); \ 58369 __ret_714; \ 58370 }) 58371 #else 58372 #define vqshrn_high_n_s64(__p0_715, __p1_715, __p2_715) __extension__ ({ \ 58373 int32x4_t __ret_715; \ 58374 int32x2_t __s0_715 = __p0_715; \ 58375 int64x2_t __s1_715 = 
__p1_715; \ 58376 int32x2_t __rev0_715; __rev0_715 = __builtin_shufflevector(__s0_715, __s0_715, 1, 0); \ 58377 int64x2_t __rev1_715; __rev1_715 = __builtin_shufflevector(__s1_715, __s1_715, 1, 0); \ 58378 __ret_715 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_715), (int32x2_t)(__noswap_vqshrn_n_s64(__rev1_715, __p2_715)))); \ 58379 __ret_715 = __builtin_shufflevector(__ret_715, __ret_715, 3, 2, 1, 0); \ 58380 __ret_715; \ 58381 }) 58382 #endif 58383 58384 #ifdef __LITTLE_ENDIAN__ 58385 #define vqshrn_high_n_s16(__p0_716, __p1_716, __p2_716) __extension__ ({ \ 58386 int8x16_t __ret_716; \ 58387 int8x8_t __s0_716 = __p0_716; \ 58388 int16x8_t __s1_716 = __p1_716; \ 58389 __ret_716 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_716), (int8x8_t)(vqshrn_n_s16(__s1_716, __p2_716)))); \ 58390 __ret_716; \ 58391 }) 58392 #else 58393 #define vqshrn_high_n_s16(__p0_717, __p1_717, __p2_717) __extension__ ({ \ 58394 int8x16_t __ret_717; \ 58395 int8x8_t __s0_717 = __p0_717; \ 58396 int16x8_t __s1_717 = __p1_717; \ 58397 int8x8_t __rev0_717; __rev0_717 = __builtin_shufflevector(__s0_717, __s0_717, 7, 6, 5, 4, 3, 2, 1, 0); \ 58398 int16x8_t __rev1_717; __rev1_717 = __builtin_shufflevector(__s1_717, __s1_717, 7, 6, 5, 4, 3, 2, 1, 0); \ 58399 __ret_717 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_717), (int8x8_t)(__noswap_vqshrn_n_s16(__rev1_717, __p2_717)))); \ 58400 __ret_717 = __builtin_shufflevector(__ret_717, __ret_717, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 58401 __ret_717; \ 58402 }) 58403 #endif 58404 58405 #define vqshrns_n_u32(__p0, __p1) __extension__ ({ \ 58406 uint16_t __ret; \ 58407 uint32_t __s0 = __p0; \ 58408 __ret = (uint16_t) __builtin_neon_vqshrns_n_u32(__s0, __p1); \ 58409 __ret; \ 58410 }) 58411 #define vqshrnd_n_u64(__p0, __p1) __extension__ ({ \ 58412 uint32_t __ret; \ 58413 uint64_t __s0 = __p0; \ 58414 __ret = (uint32_t) __builtin_neon_vqshrnd_n_u64(__s0, __p1); \ 58415 __ret; \ 58416 }) 58417 #define vqshrnh_n_u16(__p0, 
__p1) __extension__ ({ \ 58418 uint8_t __ret; \ 58419 uint16_t __s0 = __p0; \ 58420 __ret = (uint8_t) __builtin_neon_vqshrnh_n_u16(__s0, __p1); \ 58421 __ret; \ 58422 }) 58423 #define vqshrns_n_s32(__p0, __p1) __extension__ ({ \ 58424 int16_t __ret; \ 58425 int32_t __s0 = __p0; \ 58426 __ret = (int16_t) __builtin_neon_vqshrns_n_s32(__s0, __p1); \ 58427 __ret; \ 58428 }) 58429 #define vqshrnd_n_s64(__p0, __p1) __extension__ ({ \ 58430 int32_t __ret; \ 58431 int64_t __s0 = __p0; \ 58432 __ret = (int32_t) __builtin_neon_vqshrnd_n_s64(__s0, __p1); \ 58433 __ret; \ 58434 }) 58435 #define vqshrnh_n_s16(__p0, __p1) __extension__ ({ \ 58436 int8_t __ret; \ 58437 int16_t __s0 = __p0; \ 58438 __ret = (int8_t) __builtin_neon_vqshrnh_n_s16(__s0, __p1); \ 58439 __ret; \ 58440 }) 58441 #ifdef __LITTLE_ENDIAN__ 58442 #define vqshrun_high_n_s32(__p0_718, __p1_718, __p2_718) __extension__ ({ \ 58443 int16x8_t __ret_718; \ 58444 int16x4_t __s0_718 = __p0_718; \ 58445 int32x4_t __s1_718 = __p1_718; \ 58446 __ret_718 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_718), (int16x4_t)(vqshrun_n_s32(__s1_718, __p2_718)))); \ 58447 __ret_718; \ 58448 }) 58449 #else 58450 #define vqshrun_high_n_s32(__p0_719, __p1_719, __p2_719) __extension__ ({ \ 58451 int16x8_t __ret_719; \ 58452 int16x4_t __s0_719 = __p0_719; \ 58453 int32x4_t __s1_719 = __p1_719; \ 58454 int16x4_t __rev0_719; __rev0_719 = __builtin_shufflevector(__s0_719, __s0_719, 3, 2, 1, 0); \ 58455 int32x4_t __rev1_719; __rev1_719 = __builtin_shufflevector(__s1_719, __s1_719, 3, 2, 1, 0); \ 58456 __ret_719 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_719), (int16x4_t)(__noswap_vqshrun_n_s32(__rev1_719, __p2_719)))); \ 58457 __ret_719 = __builtin_shufflevector(__ret_719, __ret_719, 7, 6, 5, 4, 3, 2, 1, 0); \ 58458 __ret_719; \ 58459 }) 58460 #endif 58461 58462 #ifdef __LITTLE_ENDIAN__ 58463 #define vqshrun_high_n_s64(__p0_720, __p1_720, __p2_720) __extension__ ({ \ 58464 int32x4_t __ret_720; \ 58465 int32x2_t __s0_720 = 
__p0_720; \ 58466 int64x2_t __s1_720 = __p1_720; \ 58467 __ret_720 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_720), (int32x2_t)(vqshrun_n_s64(__s1_720, __p2_720)))); \ 58468 __ret_720; \ 58469 }) 58470 #else 58471 #define vqshrun_high_n_s64(__p0_721, __p1_721, __p2_721) __extension__ ({ \ 58472 int32x4_t __ret_721; \ 58473 int32x2_t __s0_721 = __p0_721; \ 58474 int64x2_t __s1_721 = __p1_721; \ 58475 int32x2_t __rev0_721; __rev0_721 = __builtin_shufflevector(__s0_721, __s0_721, 1, 0); \ 58476 int64x2_t __rev1_721; __rev1_721 = __builtin_shufflevector(__s1_721, __s1_721, 1, 0); \ 58477 __ret_721 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_721), (int32x2_t)(__noswap_vqshrun_n_s64(__rev1_721, __p2_721)))); \ 58478 __ret_721 = __builtin_shufflevector(__ret_721, __ret_721, 3, 2, 1, 0); \ 58479 __ret_721; \ 58480 }) 58481 #endif 58482 58483 #ifdef __LITTLE_ENDIAN__ 58484 #define vqshrun_high_n_s16(__p0_722, __p1_722, __p2_722) __extension__ ({ \ 58485 int8x16_t __ret_722; \ 58486 int8x8_t __s0_722 = __p0_722; \ 58487 int16x8_t __s1_722 = __p1_722; \ 58488 __ret_722 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_722), (int8x8_t)(vqshrun_n_s16(__s1_722, __p2_722)))); \ 58489 __ret_722; \ 58490 }) 58491 #else 58492 #define vqshrun_high_n_s16(__p0_723, __p1_723, __p2_723) __extension__ ({ \ 58493 int8x16_t __ret_723; \ 58494 int8x8_t __s0_723 = __p0_723; \ 58495 int16x8_t __s1_723 = __p1_723; \ 58496 int8x8_t __rev0_723; __rev0_723 = __builtin_shufflevector(__s0_723, __s0_723, 7, 6, 5, 4, 3, 2, 1, 0); \ 58497 int16x8_t __rev1_723; __rev1_723 = __builtin_shufflevector(__s1_723, __s1_723, 7, 6, 5, 4, 3, 2, 1, 0); \ 58498 __ret_723 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_723), (int8x8_t)(__noswap_vqshrun_n_s16(__rev1_723, __p2_723)))); \ 58499 __ret_723 = __builtin_shufflevector(__ret_723, __ret_723, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 58500 __ret_723; \ 58501 }) 58502 #endif 58503 58504 #define vqshruns_n_s32(__p0, __p1) __extension__ ({ 
\ 58505 uint16_t __ret; \ 58506 int32_t __s0 = __p0; \ 58507 __ret = (uint16_t) __builtin_neon_vqshruns_n_s32(__s0, __p1); \ 58508 __ret; \ 58509 }) 58510 #define vqshrund_n_s64(__p0, __p1) __extension__ ({ \ 58511 uint32_t __ret; \ 58512 int64_t __s0 = __p0; \ 58513 __ret = (uint32_t) __builtin_neon_vqshrund_n_s64(__s0, __p1); \ 58514 __ret; \ 58515 }) 58516 #define vqshrunh_n_s16(__p0, __p1) __extension__ ({ \ 58517 uint8_t __ret; \ 58518 int16_t __s0 = __p0; \ 58519 __ret = (uint8_t) __builtin_neon_vqshrunh_n_s16(__s0, __p1); \ 58520 __ret; \ 58521 }) 58522 __ai __attribute__((target("neon"))) uint8_t vqsubb_u8(uint8_t __p0, uint8_t __p1) { 58523 uint8_t __ret; 58524 __ret = (uint8_t) __builtin_neon_vqsubb_u8(__p0, __p1); 58525 return __ret; 58526 } 58527 __ai __attribute__((target("neon"))) uint32_t vqsubs_u32(uint32_t __p0, uint32_t __p1) { 58528 uint32_t __ret; 58529 __ret = (uint32_t) __builtin_neon_vqsubs_u32(__p0, __p1); 58530 return __ret; 58531 } 58532 __ai __attribute__((target("neon"))) uint64_t vqsubd_u64(uint64_t __p0, uint64_t __p1) { 58533 uint64_t __ret; 58534 __ret = (uint64_t) __builtin_neon_vqsubd_u64(__p0, __p1); 58535 return __ret; 58536 } 58537 __ai __attribute__((target("neon"))) uint16_t vqsubh_u16(uint16_t __p0, uint16_t __p1) { 58538 uint16_t __ret; 58539 __ret = (uint16_t) __builtin_neon_vqsubh_u16(__p0, __p1); 58540 return __ret; 58541 } 58542 __ai __attribute__((target("neon"))) int8_t vqsubb_s8(int8_t __p0, int8_t __p1) { 58543 int8_t __ret; 58544 __ret = (int8_t) __builtin_neon_vqsubb_s8(__p0, __p1); 58545 return __ret; 58546 } 58547 __ai __attribute__((target("neon"))) int32_t vqsubs_s32(int32_t __p0, int32_t __p1) { 58548 int32_t __ret; 58549 __ret = (int32_t) __builtin_neon_vqsubs_s32(__p0, __p1); 58550 return __ret; 58551 } 58552 __ai __attribute__((target("neon"))) int64_t vqsubd_s64(int64_t __p0, int64_t __p1) { 58553 int64_t __ret; 58554 __ret = (int64_t) __builtin_neon_vqsubd_s64(__p0, __p1); 58555 return __ret; 58556 } 
58557 __ai __attribute__((target("neon"))) int16_t vqsubh_s16(int16_t __p0, int16_t __p1) { 58558 int16_t __ret; 58559 __ret = (int16_t) __builtin_neon_vqsubh_s16(__p0, __p1); 58560 return __ret; 58561 } 58562 #ifdef __LITTLE_ENDIAN__ 58563 __ai __attribute__((target("neon"))) poly8x8_t vqtbl1_p8(poly8x16_t __p0, uint8x8_t __p1) { 58564 poly8x8_t __ret; 58565 __ret = (poly8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__p0, (int8x8_t)__p1, 4); 58566 return __ret; 58567 } 58568 #else 58569 __ai __attribute__((target("neon"))) poly8x8_t vqtbl1_p8(poly8x16_t __p0, uint8x8_t __p1) { 58570 poly8x8_t __ret; 58571 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58572 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58573 __ret = (poly8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__rev0, (int8x8_t)__rev1, 4); 58574 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58575 return __ret; 58576 } 58577 #endif 58578 58579 #ifdef __LITTLE_ENDIAN__ 58580 __ai __attribute__((target("neon"))) poly8x16_t vqtbl1q_p8(poly8x16_t __p0, uint8x16_t __p1) { 58581 poly8x16_t __ret; 58582 __ret = (poly8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__p0, (int8x16_t)__p1, 36); 58583 return __ret; 58584 } 58585 #else 58586 __ai __attribute__((target("neon"))) poly8x16_t vqtbl1q_p8(poly8x16_t __p0, uint8x16_t __p1) { 58587 poly8x16_t __ret; 58588 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58589 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58590 __ret = (poly8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, 36); 58591 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58592 return __ret; 58593 } 58594 #endif 58595 58596 #ifdef __LITTLE_ENDIAN__ 58597 __ai 
__attribute__((target("neon"))) uint8x16_t vqtbl1q_u8(uint8x16_t __p0, uint8x16_t __p1) { 58598 uint8x16_t __ret; 58599 __ret = (uint8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 58600 return __ret; 58601 } 58602 #else 58603 __ai __attribute__((target("neon"))) uint8x16_t vqtbl1q_u8(uint8x16_t __p0, uint8x16_t __p1) { 58604 uint8x16_t __ret; 58605 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58606 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58607 __ret = (uint8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 58608 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58609 return __ret; 58610 } 58611 #endif 58612 58613 #ifdef __LITTLE_ENDIAN__ 58614 __ai __attribute__((target("neon"))) int8x16_t vqtbl1q_s8(int8x16_t __p0, uint8x16_t __p1) { 58615 int8x16_t __ret; 58616 __ret = (int8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 58617 return __ret; 58618 } 58619 #else 58620 __ai __attribute__((target("neon"))) int8x16_t vqtbl1q_s8(int8x16_t __p0, uint8x16_t __p1) { 58621 int8x16_t __ret; 58622 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58623 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58624 __ret = (int8x16_t) __builtin_neon_vqtbl1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 58625 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58626 return __ret; 58627 } 58628 #endif 58629 58630 #ifdef __LITTLE_ENDIAN__ 58631 __ai __attribute__((target("neon"))) uint8x8_t vqtbl1_u8(uint8x16_t __p0, uint8x8_t __p1) { 58632 uint8x8_t __ret; 58633 __ret = (uint8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__p0, 
(int8x8_t)__p1, 16); 58634 return __ret; 58635 } 58636 #else 58637 __ai __attribute__((target("neon"))) uint8x8_t vqtbl1_u8(uint8x16_t __p0, uint8x8_t __p1) { 58638 uint8x8_t __ret; 58639 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58640 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58641 __ret = (uint8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__rev0, (int8x8_t)__rev1, 16); 58642 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58643 return __ret; 58644 } 58645 #endif 58646 58647 #ifdef __LITTLE_ENDIAN__ 58648 __ai __attribute__((target("neon"))) int8x8_t vqtbl1_s8(int8x16_t __p0, uint8x8_t __p1) { 58649 int8x8_t __ret; 58650 __ret = (int8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__p0, (int8x8_t)__p1, 0); 58651 return __ret; 58652 } 58653 #else 58654 __ai __attribute__((target("neon"))) int8x8_t vqtbl1_s8(int8x16_t __p0, uint8x8_t __p1) { 58655 int8x8_t __ret; 58656 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58657 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58658 __ret = (int8x8_t) __builtin_neon_vqtbl1_v((int8x16_t)__rev0, (int8x8_t)__rev1, 0); 58659 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58660 return __ret; 58661 } 58662 #endif 58663 58664 #ifdef __LITTLE_ENDIAN__ 58665 __ai __attribute__((target("neon"))) poly8x8_t vqtbl2_p8(poly8x16x2_t __p0, uint8x8_t __p1) { 58666 poly8x8_t __ret; 58667 __ret = (poly8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x8_t)__p1, 4); 58668 return __ret; 58669 } 58670 #else 58671 __ai __attribute__((target("neon"))) poly8x8_t vqtbl2_p8(poly8x16x2_t __p0, uint8x8_t __p1) { 58672 poly8x8_t __ret; 58673 poly8x16x2_t __rev0; 58674 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 
9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58675 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58676 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58677 __ret = (poly8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, 4); 58678 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58679 return __ret; 58680 } 58681 #endif 58682 58683 #ifdef __LITTLE_ENDIAN__ 58684 __ai __attribute__((target("neon"))) poly8x16_t vqtbl2q_p8(poly8x16x2_t __p0, uint8x16_t __p1) { 58685 poly8x16_t __ret; 58686 __ret = (poly8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p1, 36); 58687 return __ret; 58688 } 58689 #else 58690 __ai __attribute__((target("neon"))) poly8x16_t vqtbl2q_p8(poly8x16x2_t __p0, uint8x16_t __p1) { 58691 poly8x16_t __ret; 58692 poly8x16x2_t __rev0; 58693 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58694 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58695 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58696 __ret = (poly8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, 36); 58697 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58698 return __ret; 58699 } 58700 #endif 58701 58702 #ifdef __LITTLE_ENDIAN__ 58703 __ai __attribute__((target("neon"))) uint8x16_t vqtbl2q_u8(uint8x16x2_t __p0, uint8x16_t __p1) { 58704 uint8x16_t __ret; 58705 __ret = (uint8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p1, 48); 58706 return __ret; 58707 } 58708 #else 58709 __ai __attribute__((target("neon"))) 
uint8x16_t vqtbl2q_u8(uint8x16x2_t __p0, uint8x16_t __p1) { 58710 uint8x16_t __ret; 58711 uint8x16x2_t __rev0; 58712 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58713 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58714 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58715 __ret = (uint8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, 48); 58716 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58717 return __ret; 58718 } 58719 #endif 58720 58721 #ifdef __LITTLE_ENDIAN__ 58722 __ai __attribute__((target("neon"))) int8x16_t vqtbl2q_s8(int8x16x2_t __p0, uint8x16_t __p1) { 58723 int8x16_t __ret; 58724 __ret = (int8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p1, 32); 58725 return __ret; 58726 } 58727 #else 58728 __ai __attribute__((target("neon"))) int8x16_t vqtbl2q_s8(int8x16x2_t __p0, uint8x16_t __p1) { 58729 int8x16_t __ret; 58730 int8x16x2_t __rev0; 58731 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58732 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58733 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58734 __ret = (int8x16_t) __builtin_neon_vqtbl2q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev1, 32); 58735 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58736 return __ret; 58737 } 58738 #endif 58739 58740 #ifdef __LITTLE_ENDIAN__ 58741 __ai __attribute__((target("neon"))) uint8x8_t 
vqtbl2_u8(uint8x16x2_t __p0, uint8x8_t __p1) { 58742 uint8x8_t __ret; 58743 __ret = (uint8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x8_t)__p1, 16); 58744 return __ret; 58745 } 58746 #else 58747 __ai __attribute__((target("neon"))) uint8x8_t vqtbl2_u8(uint8x16x2_t __p0, uint8x8_t __p1) { 58748 uint8x8_t __ret; 58749 uint8x16x2_t __rev0; 58750 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58751 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58752 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58753 __ret = (uint8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, 16); 58754 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58755 return __ret; 58756 } 58757 #endif 58758 58759 #ifdef __LITTLE_ENDIAN__ 58760 __ai __attribute__((target("neon"))) int8x8_t vqtbl2_s8(int8x16x2_t __p0, uint8x8_t __p1) { 58761 int8x8_t __ret; 58762 __ret = (int8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x8_t)__p1, 0); 58763 return __ret; 58764 } 58765 #else 58766 __ai __attribute__((target("neon"))) int8x8_t vqtbl2_s8(int8x16x2_t __p0, uint8x8_t __p1) { 58767 int8x8_t __ret; 58768 int8x16x2_t __rev0; 58769 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58770 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58771 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58772 __ret = (int8x8_t) __builtin_neon_vqtbl2_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x8_t)__rev1, 0); 58773 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58774 return __ret; 
58775 } 58776 #endif 58777 58778 #ifdef __LITTLE_ENDIAN__ 58779 __ai __attribute__((target("neon"))) poly8x8_t vqtbl3_p8(poly8x16x3_t __p0, uint8x8_t __p1) { 58780 poly8x8_t __ret; 58781 __ret = (poly8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x8_t)__p1, 4); 58782 return __ret; 58783 } 58784 #else 58785 __ai __attribute__((target("neon"))) poly8x8_t vqtbl3_p8(poly8x16x3_t __p0, uint8x8_t __p1) { 58786 poly8x8_t __ret; 58787 poly8x16x3_t __rev0; 58788 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58789 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58790 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58791 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58792 __ret = (poly8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x8_t)__rev1, 4); 58793 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58794 return __ret; 58795 } 58796 #endif 58797 58798 #ifdef __LITTLE_ENDIAN__ 58799 __ai __attribute__((target("neon"))) poly8x16_t vqtbl3q_p8(poly8x16x3_t __p0, uint8x16_t __p1) { 58800 poly8x16_t __ret; 58801 __ret = (poly8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p1, 36); 58802 return __ret; 58803 } 58804 #else 58805 __ai __attribute__((target("neon"))) poly8x16_t vqtbl3q_p8(poly8x16x3_t __p0, uint8x16_t __p1) { 58806 poly8x16_t __ret; 58807 poly8x16x3_t __rev0; 58808 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58809 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 
4, 3, 2, 1, 0); 58810 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58811 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58812 __ret = (poly8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev1, 36); 58813 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58814 return __ret; 58815 } 58816 #endif 58817 58818 #ifdef __LITTLE_ENDIAN__ 58819 __ai __attribute__((target("neon"))) uint8x16_t vqtbl3q_u8(uint8x16x3_t __p0, uint8x16_t __p1) { 58820 uint8x16_t __ret; 58821 __ret = (uint8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p1, 48); 58822 return __ret; 58823 } 58824 #else 58825 __ai __attribute__((target("neon"))) uint8x16_t vqtbl3q_u8(uint8x16x3_t __p0, uint8x16_t __p1) { 58826 uint8x16_t __ret; 58827 uint8x16x3_t __rev0; 58828 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58829 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58830 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58831 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58832 __ret = (uint8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev1, 48); 58833 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58834 return __ret; 58835 } 58836 #endif 58837 58838 #ifdef __LITTLE_ENDIAN__ 58839 __ai __attribute__((target("neon"))) int8x16_t vqtbl3q_s8(int8x16x3_t 
__p0, uint8x16_t __p1) { 58840 int8x16_t __ret; 58841 __ret = (int8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p1, 32); 58842 return __ret; 58843 } 58844 #else 58845 __ai __attribute__((target("neon"))) int8x16_t vqtbl3q_s8(int8x16x3_t __p0, uint8x16_t __p1) { 58846 int8x16_t __ret; 58847 int8x16x3_t __rev0; 58848 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58849 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58850 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58851 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58852 __ret = (int8x16_t) __builtin_neon_vqtbl3q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev1, 32); 58853 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58854 return __ret; 58855 } 58856 #endif 58857 58858 #ifdef __LITTLE_ENDIAN__ 58859 __ai __attribute__((target("neon"))) uint8x8_t vqtbl3_u8(uint8x16x3_t __p0, uint8x8_t __p1) { 58860 uint8x8_t __ret; 58861 __ret = (uint8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x8_t)__p1, 16); 58862 return __ret; 58863 } 58864 #else 58865 __ai __attribute__((target("neon"))) uint8x8_t vqtbl3_u8(uint8x16x3_t __p0, uint8x8_t __p1) { 58866 uint8x8_t __ret; 58867 uint8x16x3_t __rev0; 58868 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58869 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58870 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], 
__p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58871 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58872 __ret = (uint8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x8_t)__rev1, 16); 58873 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58874 return __ret; 58875 } 58876 #endif 58877 58878 #ifdef __LITTLE_ENDIAN__ 58879 __ai __attribute__((target("neon"))) int8x8_t vqtbl3_s8(int8x16x3_t __p0, uint8x8_t __p1) { 58880 int8x8_t __ret; 58881 __ret = (int8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x8_t)__p1, 0); 58882 return __ret; 58883 } 58884 #else 58885 __ai __attribute__((target("neon"))) int8x8_t vqtbl3_s8(int8x16x3_t __p0, uint8x8_t __p1) { 58886 int8x8_t __ret; 58887 int8x16x3_t __rev0; 58888 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58889 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58890 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58891 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58892 __ret = (int8x8_t) __builtin_neon_vqtbl3_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x8_t)__rev1, 0); 58893 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58894 return __ret; 58895 } 58896 #endif 58897 58898 #ifdef __LITTLE_ENDIAN__ 58899 __ai __attribute__((target("neon"))) poly8x8_t vqtbl4_p8(poly8x16x4_t __p0, uint8x8_t __p1) { 58900 poly8x8_t __ret; 58901 __ret = (poly8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x8_t)__p1, 4); 58902 return 
__ret; 58903 } 58904 #else 58905 __ai __attribute__((target("neon"))) poly8x8_t vqtbl4_p8(poly8x16x4_t __p0, uint8x8_t __p1) { 58906 poly8x8_t __ret; 58907 poly8x16x4_t __rev0; 58908 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58909 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58910 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58911 __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58912 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58913 __ret = (poly8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x8_t)__rev1, 4); 58914 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58915 return __ret; 58916 } 58917 #endif 58918 58919 #ifdef __LITTLE_ENDIAN__ 58920 __ai __attribute__((target("neon"))) poly8x16_t vqtbl4q_p8(poly8x16x4_t __p0, uint8x16_t __p1) { 58921 poly8x16_t __ret; 58922 __ret = (poly8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x16_t)__p1, 36); 58923 return __ret; 58924 } 58925 #else 58926 __ai __attribute__((target("neon"))) poly8x16_t vqtbl4q_p8(poly8x16x4_t __p0, uint8x16_t __p1) { 58927 poly8x16_t __ret; 58928 poly8x16x4_t __rev0; 58929 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58930 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58931 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58932 
__rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58933 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58934 __ret = (poly8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x16_t)__rev1, 36); 58935 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58936 return __ret; 58937 } 58938 #endif 58939 58940 #ifdef __LITTLE_ENDIAN__ 58941 __ai __attribute__((target("neon"))) uint8x16_t vqtbl4q_u8(uint8x16x4_t __p0, uint8x16_t __p1) { 58942 uint8x16_t __ret; 58943 __ret = (uint8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x16_t)__p1, 48); 58944 return __ret; 58945 } 58946 #else 58947 __ai __attribute__((target("neon"))) uint8x16_t vqtbl4q_u8(uint8x16x4_t __p0, uint8x16_t __p1) { 58948 uint8x16_t __ret; 58949 uint8x16x4_t __rev0; 58950 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58951 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58952 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58953 __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58954 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58955 __ret = (uint8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x16_t)__rev1, 48); 58956 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 
6, 5, 4, 3, 2, 1, 0); 58957 return __ret; 58958 } 58959 #endif 58960 58961 #ifdef __LITTLE_ENDIAN__ 58962 __ai __attribute__((target("neon"))) int8x16_t vqtbl4q_s8(int8x16x4_t __p0, uint8x16_t __p1) { 58963 int8x16_t __ret; 58964 __ret = (int8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x16_t)__p1, 32); 58965 return __ret; 58966 } 58967 #else 58968 __ai __attribute__((target("neon"))) int8x16_t vqtbl4q_s8(int8x16x4_t __p0, uint8x16_t __p1) { 58969 int8x16_t __ret; 58970 int8x16x4_t __rev0; 58971 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58972 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58973 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58974 __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58975 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58976 __ret = (int8x16_t) __builtin_neon_vqtbl4q_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x16_t)__rev1, 32); 58977 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58978 return __ret; 58979 } 58980 #endif 58981 58982 #ifdef __LITTLE_ENDIAN__ 58983 __ai __attribute__((target("neon"))) uint8x8_t vqtbl4_u8(uint8x16x4_t __p0, uint8x8_t __p1) { 58984 uint8x8_t __ret; 58985 __ret = (uint8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x8_t)__p1, 16); 58986 return __ret; 58987 } 58988 #else 58989 __ai __attribute__((target("neon"))) uint8x8_t vqtbl4_u8(uint8x16x4_t __p0, 
uint8x8_t __p1) { 58990 uint8x8_t __ret; 58991 uint8x16x4_t __rev0; 58992 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58993 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58994 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58995 __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 58996 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 58997 __ret = (uint8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x8_t)__rev1, 16); 58998 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 58999 return __ret; 59000 } 59001 #endif 59002 59003 #ifdef __LITTLE_ENDIAN__ 59004 __ai __attribute__((target("neon"))) int8x8_t vqtbl4_s8(int8x16x4_t __p0, uint8x8_t __p1) { 59005 int8x8_t __ret; 59006 __ret = (int8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__p0.val[0], (int8x16_t)__p0.val[1], (int8x16_t)__p0.val[2], (int8x16_t)__p0.val[3], (int8x8_t)__p1, 0); 59007 return __ret; 59008 } 59009 #else 59010 __ai __attribute__((target("neon"))) int8x8_t vqtbl4_s8(int8x16x4_t __p0, uint8x8_t __p1) { 59011 int8x8_t __ret; 59012 int8x16x4_t __rev0; 59013 __rev0.val[0] = __builtin_shufflevector(__p0.val[0], __p0.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59014 __rev0.val[1] = __builtin_shufflevector(__p0.val[1], __p0.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59015 __rev0.val[2] = __builtin_shufflevector(__p0.val[2], __p0.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59016 __rev0.val[3] = __builtin_shufflevector(__p0.val[3], __p0.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59017 uint8x8_t 
__rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 59018 __ret = (int8x8_t) __builtin_neon_vqtbl4_v((int8x16_t)__rev0.val[0], (int8x16_t)__rev0.val[1], (int8x16_t)__rev0.val[2], (int8x16_t)__rev0.val[3], (int8x8_t)__rev1, 0); 59019 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59020 return __ret; 59021 } 59022 #endif 59023 59024 #ifdef __LITTLE_ENDIAN__ 59025 __ai __attribute__((target("neon"))) poly8x8_t vqtbx1_p8(poly8x8_t __p0, poly8x16_t __p1, uint8x8_t __p2) { 59026 poly8x8_t __ret; 59027 __ret = (poly8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__p0, (int8x16_t)__p1, (int8x8_t)__p2, 4); 59028 return __ret; 59029 } 59030 #else 59031 __ai __attribute__((target("neon"))) poly8x8_t vqtbx1_p8(poly8x8_t __p0, poly8x16_t __p1, uint8x8_t __p2) { 59032 poly8x8_t __ret; 59033 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59034 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59035 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59036 __ret = (poly8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, 4); 59037 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59038 return __ret; 59039 } 59040 #endif 59041 59042 #ifdef __LITTLE_ENDIAN__ 59043 __ai __attribute__((target("neon"))) poly8x16_t vqtbx1q_p8(poly8x16_t __p0, poly8x16_t __p1, uint8x16_t __p2) { 59044 poly8x16_t __ret; 59045 __ret = (poly8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 36); 59046 return __ret; 59047 } 59048 #else 59049 __ai __attribute__((target("neon"))) poly8x16_t vqtbx1q_p8(poly8x16_t __p0, poly8x16_t __p1, uint8x16_t __p2) { 59050 poly8x16_t __ret; 59051 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59052 poly8x16_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59053 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59054 __ret = (poly8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 36); 59055 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59056 return __ret; 59057 } 59058 #endif 59059 59060 #ifdef __LITTLE_ENDIAN__ 59061 __ai __attribute__((target("neon"))) uint8x16_t vqtbx1q_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 59062 uint8x16_t __ret; 59063 __ret = (uint8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 48); 59064 return __ret; 59065 } 59066 #else 59067 __ai __attribute__((target("neon"))) uint8x16_t vqtbx1q_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 59068 uint8x16_t __ret; 59069 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59070 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59071 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59072 __ret = (uint8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 48); 59073 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59074 return __ret; 59075 } 59076 #endif 59077 59078 #ifdef __LITTLE_ENDIAN__ 59079 __ai __attribute__((target("neon"))) int8x16_t vqtbx1q_s8(int8x16_t __p0, int8x16_t __p1, uint8x16_t __p2) { 59080 int8x16_t __ret; 59081 __ret = (int8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 32); 59082 return __ret; 59083 } 59084 #else 59085 __ai __attribute__((target("neon"))) int8x16_t vqtbx1q_s8(int8x16_t __p0, int8x16_t 
__p1, uint8x16_t __p2) { 59086 int8x16_t __ret; 59087 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59088 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59089 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59090 __ret = (int8x16_t) __builtin_neon_vqtbx1q_v((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 32); 59091 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59092 return __ret; 59093 } 59094 #endif 59095 59096 #ifdef __LITTLE_ENDIAN__ 59097 __ai __attribute__((target("neon"))) uint8x8_t vqtbx1_u8(uint8x8_t __p0, uint8x16_t __p1, uint8x8_t __p2) { 59098 uint8x8_t __ret; 59099 __ret = (uint8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__p0, (int8x16_t)__p1, (int8x8_t)__p2, 16); 59100 return __ret; 59101 } 59102 #else 59103 __ai __attribute__((target("neon"))) uint8x8_t vqtbx1_u8(uint8x8_t __p0, uint8x16_t __p1, uint8x8_t __p2) { 59104 uint8x8_t __ret; 59105 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59106 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59107 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59108 __ret = (uint8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, 16); 59109 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59110 return __ret; 59111 } 59112 #endif 59113 59114 #ifdef __LITTLE_ENDIAN__ 59115 __ai __attribute__((target("neon"))) int8x8_t vqtbx1_s8(int8x8_t __p0, int8x16_t __p1, uint8x8_t __p2) { 59116 int8x8_t __ret; 59117 __ret = (int8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__p0, (int8x16_t)__p1, (int8x8_t)__p2, 0); 59118 return __ret; 59119 } 59120 #else 59121 
__ai __attribute__((target("neon"))) int8x8_t vqtbx1_s8(int8x8_t __p0, int8x16_t __p1, uint8x8_t __p2) { 59122 int8x8_t __ret; 59123 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59124 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59125 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59126 __ret = (int8x8_t) __builtin_neon_vqtbx1_v((int8x8_t)__rev0, (int8x16_t)__rev1, (int8x8_t)__rev2, 0); 59127 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59128 return __ret; 59129 } 59130 #endif 59131 59132 #ifdef __LITTLE_ENDIAN__ 59133 __ai __attribute__((target("neon"))) poly8x8_t vqtbx2_p8(poly8x8_t __p0, poly8x16x2_t __p1, uint8x8_t __p2) { 59134 poly8x8_t __ret; 59135 __ret = (poly8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x8_t)__p2, 4); 59136 return __ret; 59137 } 59138 #else 59139 __ai __attribute__((target("neon"))) poly8x8_t vqtbx2_p8(poly8x8_t __p0, poly8x16x2_t __p1, uint8x8_t __p2) { 59140 poly8x8_t __ret; 59141 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59142 poly8x16x2_t __rev1; 59143 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59144 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59145 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59146 __ret = (poly8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x8_t)__rev2, 4); 59147 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59148 return __ret; 59149 } 59150 #endif 59151 59152 #ifdef __LITTLE_ENDIAN__ 59153 __ai __attribute__((target("neon"))) poly8x16_t vqtbx2q_p8(poly8x16_t 
__p0, poly8x16x2_t __p1, uint8x16_t __p2) { 59154 poly8x16_t __ret; 59155 __ret = (poly8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p2, 36); 59156 return __ret; 59157 } 59158 #else 59159 __ai __attribute__((target("neon"))) poly8x16_t vqtbx2q_p8(poly8x16_t __p0, poly8x16x2_t __p1, uint8x16_t __p2) { 59160 poly8x16_t __ret; 59161 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59162 poly8x16x2_t __rev1; 59163 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59164 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59165 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59166 __ret = (poly8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev2, 36); 59167 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59168 return __ret; 59169 } 59170 #endif 59171 59172 #ifdef __LITTLE_ENDIAN__ 59173 __ai __attribute__((target("neon"))) uint8x16_t vqtbx2q_u8(uint8x16_t __p0, uint8x16x2_t __p1, uint8x16_t __p2) { 59174 uint8x16_t __ret; 59175 __ret = (uint8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p2, 48); 59176 return __ret; 59177 } 59178 #else 59179 __ai __attribute__((target("neon"))) uint8x16_t vqtbx2q_u8(uint8x16_t __p0, uint8x16x2_t __p1, uint8x16_t __p2) { 59180 uint8x16_t __ret; 59181 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59182 uint8x16x2_t __rev1; 59183 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 
59184 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59185 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59186 __ret = (uint8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev2, 48); 59187 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59188 return __ret; 59189 } 59190 #endif 59191 59192 #ifdef __LITTLE_ENDIAN__ 59193 __ai __attribute__((target("neon"))) int8x16_t vqtbx2q_s8(int8x16_t __p0, int8x16x2_t __p1, uint8x16_t __p2) { 59194 int8x16_t __ret; 59195 __ret = (int8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p2, 32); 59196 return __ret; 59197 } 59198 #else 59199 __ai __attribute__((target("neon"))) int8x16_t vqtbx2q_s8(int8x16_t __p0, int8x16x2_t __p1, uint8x16_t __p2) { 59200 int8x16_t __ret; 59201 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59202 int8x16x2_t __rev1; 59203 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59204 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59205 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59206 __ret = (int8x16_t) __builtin_neon_vqtbx2q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev2, 32); 59207 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59208 return __ret; 59209 } 59210 #endif 59211 59212 #ifdef __LITTLE_ENDIAN__ 59213 __ai __attribute__((target("neon"))) uint8x8_t vqtbx2_u8(uint8x8_t __p0, uint8x16x2_t __p1, 
uint8x8_t __p2) { 59214 uint8x8_t __ret; 59215 __ret = (uint8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x8_t)__p2, 16); 59216 return __ret; 59217 } 59218 #else 59219 __ai __attribute__((target("neon"))) uint8x8_t vqtbx2_u8(uint8x8_t __p0, uint8x16x2_t __p1, uint8x8_t __p2) { 59220 uint8x8_t __ret; 59221 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59222 uint8x16x2_t __rev1; 59223 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59224 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59225 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59226 __ret = (uint8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x8_t)__rev2, 16); 59227 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59228 return __ret; 59229 } 59230 #endif 59231 59232 #ifdef __LITTLE_ENDIAN__ 59233 __ai __attribute__((target("neon"))) int8x8_t vqtbx2_s8(int8x8_t __p0, int8x16x2_t __p1, uint8x8_t __p2) { 59234 int8x8_t __ret; 59235 __ret = (int8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x8_t)__p2, 0); 59236 return __ret; 59237 } 59238 #else 59239 __ai __attribute__((target("neon"))) int8x8_t vqtbx2_s8(int8x8_t __p0, int8x16x2_t __p1, uint8x8_t __p2) { 59240 int8x8_t __ret; 59241 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59242 int8x16x2_t __rev1; 59243 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59244 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59245 uint8x8_t __rev2; __rev2 = 
__builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59246 __ret = (int8x8_t) __builtin_neon_vqtbx2_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x8_t)__rev2, 0); 59247 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59248 return __ret; 59249 } 59250 #endif 59251 59252 #ifdef __LITTLE_ENDIAN__ 59253 __ai __attribute__((target("neon"))) poly8x8_t vqtbx3_p8(poly8x8_t __p0, poly8x16x3_t __p1, uint8x8_t __p2) { 59254 poly8x8_t __ret; 59255 __ret = (poly8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x8_t)__p2, 4); 59256 return __ret; 59257 } 59258 #else 59259 __ai __attribute__((target("neon"))) poly8x8_t vqtbx3_p8(poly8x8_t __p0, poly8x16x3_t __p1, uint8x8_t __p2) { 59260 poly8x8_t __ret; 59261 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59262 poly8x16x3_t __rev1; 59263 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59264 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59265 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59266 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59267 __ret = (poly8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x8_t)__rev2, 4); 59268 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59269 return __ret; 59270 } 59271 #endif 59272 59273 #ifdef __LITTLE_ENDIAN__ 59274 __ai __attribute__((target("neon"))) poly8x16_t vqtbx3q_p8(poly8x16_t __p0, poly8x16x3_t __p1, uint8x16_t __p2) { 59275 poly8x16_t __ret; 59276 __ret = (poly8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], 
(int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p2, 36); 59277 return __ret; 59278 } 59279 #else 59280 __ai __attribute__((target("neon"))) poly8x16_t vqtbx3q_p8(poly8x16_t __p0, poly8x16x3_t __p1, uint8x16_t __p2) { 59281 poly8x16_t __ret; 59282 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59283 poly8x16x3_t __rev1; 59284 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59285 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59286 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59287 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59288 __ret = (poly8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev2, 36); 59289 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59290 return __ret; 59291 } 59292 #endif 59293 59294 #ifdef __LITTLE_ENDIAN__ 59295 __ai __attribute__((target("neon"))) uint8x16_t vqtbx3q_u8(uint8x16_t __p0, uint8x16x3_t __p1, uint8x16_t __p2) { 59296 uint8x16_t __ret; 59297 __ret = (uint8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p2, 48); 59298 return __ret; 59299 } 59300 #else 59301 __ai __attribute__((target("neon"))) uint8x16_t vqtbx3q_u8(uint8x16_t __p0, uint8x16x3_t __p1, uint8x16_t __p2) { 59302 uint8x16_t __ret; 59303 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59304 uint8x16x3_t __rev1; 59305 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 
12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59306 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59307 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59308 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59309 __ret = (uint8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev2, 48); 59310 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59311 return __ret; 59312 } 59313 #endif 59314 59315 #ifdef __LITTLE_ENDIAN__ 59316 __ai __attribute__((target("neon"))) int8x16_t vqtbx3q_s8(int8x16_t __p0, int8x16x3_t __p1, uint8x16_t __p2) { 59317 int8x16_t __ret; 59318 __ret = (int8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p2, 32); 59319 return __ret; 59320 } 59321 #else 59322 __ai __attribute__((target("neon"))) int8x16_t vqtbx3q_s8(int8x16_t __p0, int8x16x3_t __p1, uint8x16_t __p2) { 59323 int8x16_t __ret; 59324 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59325 int8x16x3_t __rev1; 59326 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59327 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59328 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59329 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59330 __ret = (int8x16_t) __builtin_neon_vqtbx3q_v((int8x16_t)__rev0, 
(int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev2, 32); 59331 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59332 return __ret; 59333 } 59334 #endif 59335 59336 #ifdef __LITTLE_ENDIAN__ 59337 __ai __attribute__((target("neon"))) uint8x8_t vqtbx3_u8(uint8x8_t __p0, uint8x16x3_t __p1, uint8x8_t __p2) { 59338 uint8x8_t __ret; 59339 __ret = (uint8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x8_t)__p2, 16); 59340 return __ret; 59341 } 59342 #else 59343 __ai __attribute__((target("neon"))) uint8x8_t vqtbx3_u8(uint8x8_t __p0, uint8x16x3_t __p1, uint8x8_t __p2) { 59344 uint8x8_t __ret; 59345 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59346 uint8x16x3_t __rev1; 59347 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59348 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59349 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59350 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59351 __ret = (uint8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x8_t)__rev2, 16); 59352 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59353 return __ret; 59354 } 59355 #endif 59356 59357 #ifdef __LITTLE_ENDIAN__ 59358 __ai __attribute__((target("neon"))) int8x8_t vqtbx3_s8(int8x8_t __p0, int8x16x3_t __p1, uint8x8_t __p2) { 59359 int8x8_t __ret; 59360 __ret = (int8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x8_t)__p2, 0); 59361 return __ret; 
59362 } 59363 #else 59364 __ai __attribute__((target("neon"))) int8x8_t vqtbx3_s8(int8x8_t __p0, int8x16x3_t __p1, uint8x8_t __p2) { 59365 int8x8_t __ret; 59366 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59367 int8x16x3_t __rev1; 59368 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59369 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59370 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59371 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59372 __ret = (int8x8_t) __builtin_neon_vqtbx3_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x8_t)__rev2, 0); 59373 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59374 return __ret; 59375 } 59376 #endif 59377 59378 #ifdef __LITTLE_ENDIAN__ 59379 __ai __attribute__((target("neon"))) poly8x8_t vqtbx4_p8(poly8x8_t __p0, poly8x16x4_t __p1, uint8x8_t __p2) { 59380 poly8x8_t __ret; 59381 __ret = (poly8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x8_t)__p2, 4); 59382 return __ret; 59383 } 59384 #else 59385 __ai __attribute__((target("neon"))) poly8x8_t vqtbx4_p8(poly8x8_t __p0, poly8x16x4_t __p1, uint8x8_t __p2) { 59386 poly8x8_t __ret; 59387 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59388 poly8x16x4_t __rev1; 59389 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59390 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59391 __rev1.val[2] = 
__builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59392 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59393 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59394 __ret = (poly8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x8_t)__rev2, 4); 59395 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59396 return __ret; 59397 } 59398 #endif 59399 59400 #ifdef __LITTLE_ENDIAN__ 59401 __ai __attribute__((target("neon"))) poly8x16_t vqtbx4q_p8(poly8x16_t __p0, poly8x16x4_t __p1, uint8x16_t __p2) { 59402 poly8x16_t __ret; 59403 __ret = (poly8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x16_t)__p2, 36); 59404 return __ret; 59405 } 59406 #else 59407 __ai __attribute__((target("neon"))) poly8x16_t vqtbx4q_p8(poly8x16_t __p0, poly8x16x4_t __p1, uint8x16_t __p2) { 59408 poly8x16_t __ret; 59409 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59410 poly8x16x4_t __rev1; 59411 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59412 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59413 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59414 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59415 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59416 __ret = 
(poly8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x16_t)__rev2, 36); 59417 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59418 return __ret; 59419 } 59420 #endif 59421 59422 #ifdef __LITTLE_ENDIAN__ 59423 __ai __attribute__((target("neon"))) uint8x16_t vqtbx4q_u8(uint8x16_t __p0, uint8x16x4_t __p1, uint8x16_t __p2) { 59424 uint8x16_t __ret; 59425 __ret = (uint8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x16_t)__p2, 48); 59426 return __ret; 59427 } 59428 #else 59429 __ai __attribute__((target("neon"))) uint8x16_t vqtbx4q_u8(uint8x16_t __p0, uint8x16x4_t __p1, uint8x16_t __p2) { 59430 uint8x16_t __ret; 59431 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59432 uint8x16x4_t __rev1; 59433 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59434 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59435 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59436 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59437 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59438 __ret = (uint8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x16_t)__rev2, 48); 59439 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59440 return __ret; 
59441 } 59442 #endif 59443 59444 #ifdef __LITTLE_ENDIAN__ 59445 __ai __attribute__((target("neon"))) int8x16_t vqtbx4q_s8(int8x16_t __p0, int8x16x4_t __p1, uint8x16_t __p2) { 59446 int8x16_t __ret; 59447 __ret = (int8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x16_t)__p2, 32); 59448 return __ret; 59449 } 59450 #else 59451 __ai __attribute__((target("neon"))) int8x16_t vqtbx4q_s8(int8x16_t __p0, int8x16x4_t __p1, uint8x16_t __p2) { 59452 int8x16_t __ret; 59453 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59454 int8x16x4_t __rev1; 59455 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59456 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59457 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59458 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59459 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59460 __ret = (int8x16_t) __builtin_neon_vqtbx4q_v((int8x16_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x16_t)__rev2, 32); 59461 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59462 return __ret; 59463 } 59464 #endif 59465 59466 #ifdef __LITTLE_ENDIAN__ 59467 __ai __attribute__((target("neon"))) uint8x8_t vqtbx4_u8(uint8x8_t __p0, uint8x16x4_t __p1, uint8x8_t __p2) { 59468 uint8x8_t __ret; 59469 __ret = (uint8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], 
(int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x8_t)__p2, 16); 59470 return __ret; 59471 } 59472 #else 59473 __ai __attribute__((target("neon"))) uint8x8_t vqtbx4_u8(uint8x8_t __p0, uint8x16x4_t __p1, uint8x8_t __p2) { 59474 uint8x8_t __ret; 59475 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59476 uint8x16x4_t __rev1; 59477 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], __p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59478 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59479 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59480 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59481 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59482 __ret = (uint8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x8_t)__rev2, 16); 59483 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59484 return __ret; 59485 } 59486 #endif 59487 59488 #ifdef __LITTLE_ENDIAN__ 59489 __ai __attribute__((target("neon"))) int8x8_t vqtbx4_s8(int8x8_t __p0, int8x16x4_t __p1, uint8x8_t __p2) { 59490 int8x8_t __ret; 59491 __ret = (int8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__p0, (int8x16_t)__p1.val[0], (int8x16_t)__p1.val[1], (int8x16_t)__p1.val[2], (int8x16_t)__p1.val[3], (int8x8_t)__p2, 0); 59492 return __ret; 59493 } 59494 #else 59495 __ai __attribute__((target("neon"))) int8x8_t vqtbx4_s8(int8x8_t __p0, int8x16x4_t __p1, uint8x8_t __p2) { 59496 int8x8_t __ret; 59497 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59498 int8x16x4_t __rev1; 59499 __rev1.val[0] = __builtin_shufflevector(__p1.val[0], 
__p1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59500 __rev1.val[1] = __builtin_shufflevector(__p1.val[1], __p1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59501 __rev1.val[2] = __builtin_shufflevector(__p1.val[2], __p1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59502 __rev1.val[3] = __builtin_shufflevector(__p1.val[3], __p1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59503 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59504 __ret = (int8x8_t) __builtin_neon_vqtbx4_v((int8x8_t)__rev0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], (int8x8_t)__rev2, 0); 59505 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59506 return __ret; 59507 } 59508 #endif 59509 59510 #ifdef __LITTLE_ENDIAN__ 59511 __ai __attribute__((target("neon"))) uint16x8_t vraddhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 59512 uint16x8_t __ret; 59513 __ret = vcombine_u16(__p0, vraddhn_u32(__p1, __p2)); 59514 return __ret; 59515 } 59516 #else 59517 __ai __attribute__((target("neon"))) uint16x8_t vraddhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 59518 uint16x8_t __ret; 59519 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 59520 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 59521 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 59522 __ret = __noswap_vcombine_u16(__rev0, __noswap_vraddhn_u32(__rev1, __rev2)); 59523 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59524 return __ret; 59525 } 59526 #endif 59527 59528 #ifdef __LITTLE_ENDIAN__ 59529 __ai __attribute__((target("neon"))) uint32x4_t vraddhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 59530 uint32x4_t __ret; 59531 __ret = vcombine_u32(__p0, vraddhn_u64(__p1, __p2)); 59532 return __ret; 
59533 } 59534 #else 59535 __ai __attribute__((target("neon"))) uint32x4_t vraddhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 59536 uint32x4_t __ret; 59537 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 59538 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 59539 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 59540 __ret = __noswap_vcombine_u32(__rev0, __noswap_vraddhn_u64(__rev1, __rev2)); 59541 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 59542 return __ret; 59543 } 59544 #endif 59545 59546 #ifdef __LITTLE_ENDIAN__ 59547 __ai __attribute__((target("neon"))) uint8x16_t vraddhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 59548 uint8x16_t __ret; 59549 __ret = vcombine_u8(__p0, vraddhn_u16(__p1, __p2)); 59550 return __ret; 59551 } 59552 #else 59553 __ai __attribute__((target("neon"))) uint8x16_t vraddhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 59554 uint8x16_t __ret; 59555 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59556 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 59557 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59558 __ret = __noswap_vcombine_u8(__rev0, __noswap_vraddhn_u16(__rev1, __rev2)); 59559 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59560 return __ret; 59561 } 59562 #endif 59563 59564 #ifdef __LITTLE_ENDIAN__ 59565 __ai __attribute__((target("neon"))) int16x8_t vraddhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 59566 int16x8_t __ret; 59567 __ret = vcombine_s16(__p0, vraddhn_s32(__p1, __p2)); 59568 return __ret; 59569 } 59570 #else 59571 __ai __attribute__((target("neon"))) int16x8_t vraddhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 59572 int16x8_t __ret; 59573 int16x4_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 59574 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 59575 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 59576 __ret = __noswap_vcombine_s16(__rev0, __noswap_vraddhn_s32(__rev1, __rev2)); 59577 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59578 return __ret; 59579 } 59580 #endif 59581 59582 #ifdef __LITTLE_ENDIAN__ 59583 __ai __attribute__((target("neon"))) int32x4_t vraddhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 59584 int32x4_t __ret; 59585 __ret = vcombine_s32(__p0, vraddhn_s64(__p1, __p2)); 59586 return __ret; 59587 } 59588 #else 59589 __ai __attribute__((target("neon"))) int32x4_t vraddhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 59590 int32x4_t __ret; 59591 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 59592 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 59593 int64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 59594 __ret = __noswap_vcombine_s32(__rev0, __noswap_vraddhn_s64(__rev1, __rev2)); 59595 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 59596 return __ret; 59597 } 59598 #endif 59599 59600 #ifdef __LITTLE_ENDIAN__ 59601 __ai __attribute__((target("neon"))) int8x16_t vraddhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 59602 int8x16_t __ret; 59603 __ret = vcombine_s8(__p0, vraddhn_s16(__p1, __p2)); 59604 return __ret; 59605 } 59606 #else 59607 __ai __attribute__((target("neon"))) int8x16_t vraddhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 59608 int8x16_t __ret; 59609 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59610 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 59611 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 59612 __ret = __noswap_vcombine_s8(__rev0, 
__noswap_vraddhn_s16(__rev1, __rev2)); 59613 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59614 return __ret; 59615 } 59616 #endif 59617 59618 #ifdef __LITTLE_ENDIAN__ 59619 __ai __attribute__((target("neon"))) poly8x8_t vrbit_p8(poly8x8_t __p0) { 59620 poly8x8_t __ret; 59621 __ret = (poly8x8_t) __builtin_neon_vrbit_v((int8x8_t)__p0, 4); 59622 return __ret; 59623 } 59624 #else 59625 __ai __attribute__((target("neon"))) poly8x8_t vrbit_p8(poly8x8_t __p0) { 59626 poly8x8_t __ret; 59627 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59628 __ret = (poly8x8_t) __builtin_neon_vrbit_v((int8x8_t)__rev0, 4); 59629 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59630 return __ret; 59631 } 59632 #endif 59633 59634 #ifdef __LITTLE_ENDIAN__ 59635 __ai __attribute__((target("neon"))) poly8x16_t vrbitq_p8(poly8x16_t __p0) { 59636 poly8x16_t __ret; 59637 __ret = (poly8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__p0, 36); 59638 return __ret; 59639 } 59640 #else 59641 __ai __attribute__((target("neon"))) poly8x16_t vrbitq_p8(poly8x16_t __p0) { 59642 poly8x16_t __ret; 59643 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59644 __ret = (poly8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__rev0, 36); 59645 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59646 return __ret; 59647 } 59648 #endif 59649 59650 #ifdef __LITTLE_ENDIAN__ 59651 __ai __attribute__((target("neon"))) uint8x16_t vrbitq_u8(uint8x16_t __p0) { 59652 uint8x16_t __ret; 59653 __ret = (uint8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__p0, 48); 59654 return __ret; 59655 } 59656 #else 59657 __ai __attribute__((target("neon"))) uint8x16_t vrbitq_u8(uint8x16_t __p0) { 59658 uint8x16_t __ret; 59659 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 
7, 6, 5, 4, 3, 2, 1, 0); 59660 __ret = (uint8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__rev0, 48); 59661 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59662 return __ret; 59663 } 59664 #endif 59665 59666 #ifdef __LITTLE_ENDIAN__ 59667 __ai __attribute__((target("neon"))) int8x16_t vrbitq_s8(int8x16_t __p0) { 59668 int8x16_t __ret; 59669 __ret = (int8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__p0, 32); 59670 return __ret; 59671 } 59672 #else 59673 __ai __attribute__((target("neon"))) int8x16_t vrbitq_s8(int8x16_t __p0) { 59674 int8x16_t __ret; 59675 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59676 __ret = (int8x16_t) __builtin_neon_vrbitq_v((int8x16_t)__rev0, 32); 59677 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 59678 return __ret; 59679 } 59680 #endif 59681 59682 #ifdef __LITTLE_ENDIAN__ 59683 __ai __attribute__((target("neon"))) uint8x8_t vrbit_u8(uint8x8_t __p0) { 59684 uint8x8_t __ret; 59685 __ret = (uint8x8_t) __builtin_neon_vrbit_v((int8x8_t)__p0, 16); 59686 return __ret; 59687 } 59688 #else 59689 __ai __attribute__((target("neon"))) uint8x8_t vrbit_u8(uint8x8_t __p0) { 59690 uint8x8_t __ret; 59691 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 59692 __ret = (uint8x8_t) __builtin_neon_vrbit_v((int8x8_t)__rev0, 16); 59693 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59694 return __ret; 59695 } 59696 #endif 59697 59698 #ifdef __LITTLE_ENDIAN__ 59699 __ai __attribute__((target("neon"))) int8x8_t vrbit_s8(int8x8_t __p0) { 59700 int8x8_t __ret; 59701 __ret = (int8x8_t) __builtin_neon_vrbit_v((int8x8_t)__p0, 0); 59702 return __ret; 59703 } 59704 #else 59705 __ai __attribute__((target("neon"))) int8x8_t vrbit_s8(int8x8_t __p0) { 59706 int8x8_t __ret; 59707 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, 
__p0, 7, 6, 5, 4, 3, 2, 1, 0); 59708 __ret = (int8x8_t) __builtin_neon_vrbit_v((int8x8_t)__rev0, 0); 59709 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 59710 return __ret; 59711 } 59712 #endif 59713 59714 #ifdef __LITTLE_ENDIAN__ 59715 __ai __attribute__((target("neon"))) float64x2_t vrecpeq_f64(float64x2_t __p0) { 59716 float64x2_t __ret; 59717 __ret = (float64x2_t) __builtin_neon_vrecpeq_v((int8x16_t)__p0, 42); 59718 return __ret; 59719 } 59720 #else 59721 __ai __attribute__((target("neon"))) float64x2_t vrecpeq_f64(float64x2_t __p0) { 59722 float64x2_t __ret; 59723 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 59724 __ret = (float64x2_t) __builtin_neon_vrecpeq_v((int8x16_t)__rev0, 42); 59725 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 59726 return __ret; 59727 } 59728 #endif 59729 59730 __ai __attribute__((target("neon"))) float64x1_t vrecpe_f64(float64x1_t __p0) { 59731 float64x1_t __ret; 59732 __ret = (float64x1_t) __builtin_neon_vrecpe_v((int8x8_t)__p0, 10); 59733 return __ret; 59734 } 59735 __ai __attribute__((target("neon"))) float64_t vrecped_f64(float64_t __p0) { 59736 float64_t __ret; 59737 __ret = (float64_t) __builtin_neon_vrecped_f64(__p0); 59738 return __ret; 59739 } 59740 __ai __attribute__((target("neon"))) float32_t vrecpes_f32(float32_t __p0) { 59741 float32_t __ret; 59742 __ret = (float32_t) __builtin_neon_vrecpes_f32(__p0); 59743 return __ret; 59744 } 59745 #ifdef __LITTLE_ENDIAN__ 59746 __ai __attribute__((target("neon"))) float64x2_t vrecpsq_f64(float64x2_t __p0, float64x2_t __p1) { 59747 float64x2_t __ret; 59748 __ret = (float64x2_t) __builtin_neon_vrecpsq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 59749 return __ret; 59750 } 59751 #else 59752 __ai __attribute__((target("neon"))) float64x2_t vrecpsq_f64(float64x2_t __p0, float64x2_t __p1) { 59753 float64x2_t __ret; 59754 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 59755 float64x2_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 1, 0); 59756 __ret = (float64x2_t) __builtin_neon_vrecpsq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 59757 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 59758 return __ret; 59759 } 59760 #endif 59761 59762 __ai __attribute__((target("neon"))) float64x1_t vrecps_f64(float64x1_t __p0, float64x1_t __p1) { 59763 float64x1_t __ret; 59764 __ret = (float64x1_t) __builtin_neon_vrecps_v((int8x8_t)__p0, (int8x8_t)__p1, 10); 59765 return __ret; 59766 } 59767 __ai __attribute__((target("neon"))) float64_t vrecpsd_f64(float64_t __p0, float64_t __p1) { 59768 float64_t __ret; 59769 __ret = (float64_t) __builtin_neon_vrecpsd_f64(__p0, __p1); 59770 return __ret; 59771 } 59772 __ai __attribute__((target("neon"))) float32_t vrecpss_f32(float32_t __p0, float32_t __p1) { 59773 float32_t __ret; 59774 __ret = (float32_t) __builtin_neon_vrecpss_f32(__p0, __p1); 59775 return __ret; 59776 } 59777 __ai __attribute__((target("neon"))) float64_t vrecpxd_f64(float64_t __p0) { 59778 float64_t __ret; 59779 __ret = (float64_t) __builtin_neon_vrecpxd_f64(__p0); 59780 return __ret; 59781 } 59782 __ai __attribute__((target("neon"))) float32_t vrecpxs_f32(float32_t __p0) { 59783 float32_t __ret; 59784 __ret = (float32_t) __builtin_neon_vrecpxs_f32(__p0); 59785 return __ret; 59786 } 59787 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_p64(poly64x1_t __p0) { 59788 poly8x8_t __ret; 59789 __ret = (poly8x8_t)(__p0); 59790 return __ret; 59791 } 59792 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_p16(poly16x4_t __p0) { 59793 poly8x8_t __ret; 59794 __ret = (poly8x8_t)(__p0); 59795 return __ret; 59796 } 59797 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u8(uint8x8_t __p0) { 59798 poly8x8_t __ret; 59799 __ret = (poly8x8_t)(__p0); 59800 return __ret; 59801 } 59802 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u32(uint32x2_t __p0) { 59803 poly8x8_t __ret; 59804 __ret = (poly8x8_t)(__p0); 59805 return 
__ret; 59806 } 59807 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u64(uint64x1_t __p0) { 59808 poly8x8_t __ret; 59809 __ret = (poly8x8_t)(__p0); 59810 return __ret; 59811 } 59812 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_u16(uint16x4_t __p0) { 59813 poly8x8_t __ret; 59814 __ret = (poly8x8_t)(__p0); 59815 return __ret; 59816 } 59817 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s8(int8x8_t __p0) { 59818 poly8x8_t __ret; 59819 __ret = (poly8x8_t)(__p0); 59820 return __ret; 59821 } 59822 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f64(float64x1_t __p0) { 59823 poly8x8_t __ret; 59824 __ret = (poly8x8_t)(__p0); 59825 return __ret; 59826 } 59827 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f32(float32x2_t __p0) { 59828 poly8x8_t __ret; 59829 __ret = (poly8x8_t)(__p0); 59830 return __ret; 59831 } 59832 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_f16(float16x4_t __p0) { 59833 poly8x8_t __ret; 59834 __ret = (poly8x8_t)(__p0); 59835 return __ret; 59836 } 59837 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s32(int32x2_t __p0) { 59838 poly8x8_t __ret; 59839 __ret = (poly8x8_t)(__p0); 59840 return __ret; 59841 } 59842 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s64(int64x1_t __p0) { 59843 poly8x8_t __ret; 59844 __ret = (poly8x8_t)(__p0); 59845 return __ret; 59846 } 59847 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_mf8(mfloat8x8_t __p0) { 59848 poly8x8_t __ret; 59849 __ret = (poly8x8_t)(__p0); 59850 return __ret; 59851 } 59852 __ai __attribute__((target("neon"))) poly8x8_t vreinterpret_p8_s16(int16x4_t __p0) { 59853 poly8x8_t __ret; 59854 __ret = (poly8x8_t)(__p0); 59855 return __ret; 59856 } 59857 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_p8(poly8x8_t __p0) { 59858 poly64x1_t __ret; 59859 __ret = (poly64x1_t)(__p0); 59860 return __ret; 59861 } 59862 __ai __attribute__((target("neon"))) 
poly64x1_t vreinterpret_p64_p16(poly16x4_t __p0) { 59863 poly64x1_t __ret; 59864 __ret = (poly64x1_t)(__p0); 59865 return __ret; 59866 } 59867 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_u8(uint8x8_t __p0) { 59868 poly64x1_t __ret; 59869 __ret = (poly64x1_t)(__p0); 59870 return __ret; 59871 } 59872 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_u32(uint32x2_t __p0) { 59873 poly64x1_t __ret; 59874 __ret = (poly64x1_t)(__p0); 59875 return __ret; 59876 } 59877 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_u64(uint64x1_t __p0) { 59878 poly64x1_t __ret; 59879 __ret = (poly64x1_t)(__p0); 59880 return __ret; 59881 } 59882 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_u16(uint16x4_t __p0) { 59883 poly64x1_t __ret; 59884 __ret = (poly64x1_t)(__p0); 59885 return __ret; 59886 } 59887 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_s8(int8x8_t __p0) { 59888 poly64x1_t __ret; 59889 __ret = (poly64x1_t)(__p0); 59890 return __ret; 59891 } 59892 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_f64(float64x1_t __p0) { 59893 poly64x1_t __ret; 59894 __ret = (poly64x1_t)(__p0); 59895 return __ret; 59896 } 59897 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_f32(float32x2_t __p0) { 59898 poly64x1_t __ret; 59899 __ret = (poly64x1_t)(__p0); 59900 return __ret; 59901 } 59902 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_f16(float16x4_t __p0) { 59903 poly64x1_t __ret; 59904 __ret = (poly64x1_t)(__p0); 59905 return __ret; 59906 } 59907 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_s32(int32x2_t __p0) { 59908 poly64x1_t __ret; 59909 __ret = (poly64x1_t)(__p0); 59910 return __ret; 59911 } 59912 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_s64(int64x1_t __p0) { 59913 poly64x1_t __ret; 59914 __ret = (poly64x1_t)(__p0); 59915 return __ret; 59916 } 59917 __ai __attribute__((target("neon"))) poly64x1_t 
vreinterpret_p64_mf8(mfloat8x8_t __p0) { 59918 poly64x1_t __ret; 59919 __ret = (poly64x1_t)(__p0); 59920 return __ret; 59921 } 59922 __ai __attribute__((target("neon"))) poly64x1_t vreinterpret_p64_s16(int16x4_t __p0) { 59923 poly64x1_t __ret; 59924 __ret = (poly64x1_t)(__p0); 59925 return __ret; 59926 } 59927 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_p8(poly8x8_t __p0) { 59928 poly16x4_t __ret; 59929 __ret = (poly16x4_t)(__p0); 59930 return __ret; 59931 } 59932 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_p64(poly64x1_t __p0) { 59933 poly16x4_t __ret; 59934 __ret = (poly16x4_t)(__p0); 59935 return __ret; 59936 } 59937 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u8(uint8x8_t __p0) { 59938 poly16x4_t __ret; 59939 __ret = (poly16x4_t)(__p0); 59940 return __ret; 59941 } 59942 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u32(uint32x2_t __p0) { 59943 poly16x4_t __ret; 59944 __ret = (poly16x4_t)(__p0); 59945 return __ret; 59946 } 59947 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u64(uint64x1_t __p0) { 59948 poly16x4_t __ret; 59949 __ret = (poly16x4_t)(__p0); 59950 return __ret; 59951 } 59952 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_u16(uint16x4_t __p0) { 59953 poly16x4_t __ret; 59954 __ret = (poly16x4_t)(__p0); 59955 return __ret; 59956 } 59957 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s8(int8x8_t __p0) { 59958 poly16x4_t __ret; 59959 __ret = (poly16x4_t)(__p0); 59960 return __ret; 59961 } 59962 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f64(float64x1_t __p0) { 59963 poly16x4_t __ret; 59964 __ret = (poly16x4_t)(__p0); 59965 return __ret; 59966 } 59967 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_f32(float32x2_t __p0) { 59968 poly16x4_t __ret; 59969 __ret = (poly16x4_t)(__p0); 59970 return __ret; 59971 } 59972 __ai __attribute__((target("neon"))) poly16x4_t 
vreinterpret_p16_f16(float16x4_t __p0) { 59973 poly16x4_t __ret; 59974 __ret = (poly16x4_t)(__p0); 59975 return __ret; 59976 } 59977 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s32(int32x2_t __p0) { 59978 poly16x4_t __ret; 59979 __ret = (poly16x4_t)(__p0); 59980 return __ret; 59981 } 59982 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s64(int64x1_t __p0) { 59983 poly16x4_t __ret; 59984 __ret = (poly16x4_t)(__p0); 59985 return __ret; 59986 } 59987 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_mf8(mfloat8x8_t __p0) { 59988 poly16x4_t __ret; 59989 __ret = (poly16x4_t)(__p0); 59990 return __ret; 59991 } 59992 __ai __attribute__((target("neon"))) poly16x4_t vreinterpret_p16_s16(int16x4_t __p0) { 59993 poly16x4_t __ret; 59994 __ret = (poly16x4_t)(__p0); 59995 return __ret; 59996 } 59997 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_p128(poly128_t __p0) { 59998 poly8x16_t __ret; 59999 __ret = (poly8x16_t)(__p0); 60000 return __ret; 60001 } 60002 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_p64(poly64x2_t __p0) { 60003 poly8x16_t __ret; 60004 __ret = (poly8x16_t)(__p0); 60005 return __ret; 60006 } 60007 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_p16(poly16x8_t __p0) { 60008 poly8x16_t __ret; 60009 __ret = (poly8x16_t)(__p0); 60010 return __ret; 60011 } 60012 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u8(uint8x16_t __p0) { 60013 poly8x16_t __ret; 60014 __ret = (poly8x16_t)(__p0); 60015 return __ret; 60016 } 60017 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u32(uint32x4_t __p0) { 60018 poly8x16_t __ret; 60019 __ret = (poly8x16_t)(__p0); 60020 return __ret; 60021 } 60022 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_u64(uint64x2_t __p0) { 60023 poly8x16_t __ret; 60024 __ret = (poly8x16_t)(__p0); 60025 return __ret; 60026 } 60027 __ai __attribute__((target("neon"))) poly8x16_t 
vreinterpretq_p8_u16(uint16x8_t __p0) { 60028 poly8x16_t __ret; 60029 __ret = (poly8x16_t)(__p0); 60030 return __ret; 60031 } 60032 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s8(int8x16_t __p0) { 60033 poly8x16_t __ret; 60034 __ret = (poly8x16_t)(__p0); 60035 return __ret; 60036 } 60037 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f64(float64x2_t __p0) { 60038 poly8x16_t __ret; 60039 __ret = (poly8x16_t)(__p0); 60040 return __ret; 60041 } 60042 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f32(float32x4_t __p0) { 60043 poly8x16_t __ret; 60044 __ret = (poly8x16_t)(__p0); 60045 return __ret; 60046 } 60047 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_f16(float16x8_t __p0) { 60048 poly8x16_t __ret; 60049 __ret = (poly8x16_t)(__p0); 60050 return __ret; 60051 } 60052 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s32(int32x4_t __p0) { 60053 poly8x16_t __ret; 60054 __ret = (poly8x16_t)(__p0); 60055 return __ret; 60056 } 60057 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s64(int64x2_t __p0) { 60058 poly8x16_t __ret; 60059 __ret = (poly8x16_t)(__p0); 60060 return __ret; 60061 } 60062 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_mf8(mfloat8x16_t __p0) { 60063 poly8x16_t __ret; 60064 __ret = (poly8x16_t)(__p0); 60065 return __ret; 60066 } 60067 __ai __attribute__((target("neon"))) poly8x16_t vreinterpretq_p8_s16(int16x8_t __p0) { 60068 poly8x16_t __ret; 60069 __ret = (poly8x16_t)(__p0); 60070 return __ret; 60071 } 60072 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_p8(poly8x16_t __p0) { 60073 poly128_t __ret; 60074 __ret = (poly128_t)(__p0); 60075 return __ret; 60076 } 60077 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_p64(poly64x2_t __p0) { 60078 poly128_t __ret; 60079 __ret = (poly128_t)(__p0); 60080 return __ret; 60081 } 60082 __ai __attribute__((target("neon"))) poly128_t 
vreinterpretq_p128_p16(poly16x8_t __p0) { 60083 poly128_t __ret; 60084 __ret = (poly128_t)(__p0); 60085 return __ret; 60086 } 60087 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_u8(uint8x16_t __p0) { 60088 poly128_t __ret; 60089 __ret = (poly128_t)(__p0); 60090 return __ret; 60091 } 60092 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_u32(uint32x4_t __p0) { 60093 poly128_t __ret; 60094 __ret = (poly128_t)(__p0); 60095 return __ret; 60096 } 60097 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_u64(uint64x2_t __p0) { 60098 poly128_t __ret; 60099 __ret = (poly128_t)(__p0); 60100 return __ret; 60101 } 60102 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_u16(uint16x8_t __p0) { 60103 poly128_t __ret; 60104 __ret = (poly128_t)(__p0); 60105 return __ret; 60106 } 60107 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_s8(int8x16_t __p0) { 60108 poly128_t __ret; 60109 __ret = (poly128_t)(__p0); 60110 return __ret; 60111 } 60112 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_f64(float64x2_t __p0) { 60113 poly128_t __ret; 60114 __ret = (poly128_t)(__p0); 60115 return __ret; 60116 } 60117 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_f32(float32x4_t __p0) { 60118 poly128_t __ret; 60119 __ret = (poly128_t)(__p0); 60120 return __ret; 60121 } 60122 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_f16(float16x8_t __p0) { 60123 poly128_t __ret; 60124 __ret = (poly128_t)(__p0); 60125 return __ret; 60126 } 60127 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_s32(int32x4_t __p0) { 60128 poly128_t __ret; 60129 __ret = (poly128_t)(__p0); 60130 return __ret; 60131 } 60132 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_s64(int64x2_t __p0) { 60133 poly128_t __ret; 60134 __ret = (poly128_t)(__p0); 60135 return __ret; 60136 } 60137 __ai __attribute__((target("neon"))) poly128_t 
vreinterpretq_p128_mf8(mfloat8x16_t __p0) { 60138 poly128_t __ret; 60139 __ret = (poly128_t)(__p0); 60140 return __ret; 60141 } 60142 __ai __attribute__((target("neon"))) poly128_t vreinterpretq_p128_s16(int16x8_t __p0) { 60143 poly128_t __ret; 60144 __ret = (poly128_t)(__p0); 60145 return __ret; 60146 } 60147 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_p8(poly8x16_t __p0) { 60148 poly64x2_t __ret; 60149 __ret = (poly64x2_t)(__p0); 60150 return __ret; 60151 } 60152 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_p128(poly128_t __p0) { 60153 poly64x2_t __ret; 60154 __ret = (poly64x2_t)(__p0); 60155 return __ret; 60156 } 60157 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_p16(poly16x8_t __p0) { 60158 poly64x2_t __ret; 60159 __ret = (poly64x2_t)(__p0); 60160 return __ret; 60161 } 60162 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_u8(uint8x16_t __p0) { 60163 poly64x2_t __ret; 60164 __ret = (poly64x2_t)(__p0); 60165 return __ret; 60166 } 60167 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_u32(uint32x4_t __p0) { 60168 poly64x2_t __ret; 60169 __ret = (poly64x2_t)(__p0); 60170 return __ret; 60171 } 60172 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_u64(uint64x2_t __p0) { 60173 poly64x2_t __ret; 60174 __ret = (poly64x2_t)(__p0); 60175 return __ret; 60176 } 60177 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_u16(uint16x8_t __p0) { 60178 poly64x2_t __ret; 60179 __ret = (poly64x2_t)(__p0); 60180 return __ret; 60181 } 60182 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_s8(int8x16_t __p0) { 60183 poly64x2_t __ret; 60184 __ret = (poly64x2_t)(__p0); 60185 return __ret; 60186 } 60187 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_f64(float64x2_t __p0) { 60188 poly64x2_t __ret; 60189 __ret = (poly64x2_t)(__p0); 60190 return __ret; 60191 } 60192 __ai __attribute__((target("neon"))) poly64x2_t 
vreinterpretq_p64_f32(float32x4_t __p0) { 60193 poly64x2_t __ret; 60194 __ret = (poly64x2_t)(__p0); 60195 return __ret; 60196 } 60197 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_f16(float16x8_t __p0) { 60198 poly64x2_t __ret; 60199 __ret = (poly64x2_t)(__p0); 60200 return __ret; 60201 } 60202 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_s32(int32x4_t __p0) { 60203 poly64x2_t __ret; 60204 __ret = (poly64x2_t)(__p0); 60205 return __ret; 60206 } 60207 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_s64(int64x2_t __p0) { 60208 poly64x2_t __ret; 60209 __ret = (poly64x2_t)(__p0); 60210 return __ret; 60211 } 60212 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_mf8(mfloat8x16_t __p0) { 60213 poly64x2_t __ret; 60214 __ret = (poly64x2_t)(__p0); 60215 return __ret; 60216 } 60217 __ai __attribute__((target("neon"))) poly64x2_t vreinterpretq_p64_s16(int16x8_t __p0) { 60218 poly64x2_t __ret; 60219 __ret = (poly64x2_t)(__p0); 60220 return __ret; 60221 } 60222 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_p8(poly8x16_t __p0) { 60223 poly16x8_t __ret; 60224 __ret = (poly16x8_t)(__p0); 60225 return __ret; 60226 } 60227 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_p128(poly128_t __p0) { 60228 poly16x8_t __ret; 60229 __ret = (poly16x8_t)(__p0); 60230 return __ret; 60231 } 60232 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_p64(poly64x2_t __p0) { 60233 poly16x8_t __ret; 60234 __ret = (poly16x8_t)(__p0); 60235 return __ret; 60236 } 60237 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u8(uint8x16_t __p0) { 60238 poly16x8_t __ret; 60239 __ret = (poly16x8_t)(__p0); 60240 return __ret; 60241 } 60242 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u32(uint32x4_t __p0) { 60243 poly16x8_t __ret; 60244 __ret = (poly16x8_t)(__p0); 60245 return __ret; 60246 } 60247 __ai __attribute__((target("neon"))) poly16x8_t 
vreinterpretq_p16_u64(uint64x2_t __p0) { 60248 poly16x8_t __ret; 60249 __ret = (poly16x8_t)(__p0); 60250 return __ret; 60251 } 60252 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_u16(uint16x8_t __p0) { 60253 poly16x8_t __ret; 60254 __ret = (poly16x8_t)(__p0); 60255 return __ret; 60256 } 60257 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s8(int8x16_t __p0) { 60258 poly16x8_t __ret; 60259 __ret = (poly16x8_t)(__p0); 60260 return __ret; 60261 } 60262 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f64(float64x2_t __p0) { 60263 poly16x8_t __ret; 60264 __ret = (poly16x8_t)(__p0); 60265 return __ret; 60266 } 60267 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f32(float32x4_t __p0) { 60268 poly16x8_t __ret; 60269 __ret = (poly16x8_t)(__p0); 60270 return __ret; 60271 } 60272 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_f16(float16x8_t __p0) { 60273 poly16x8_t __ret; 60274 __ret = (poly16x8_t)(__p0); 60275 return __ret; 60276 } 60277 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s32(int32x4_t __p0) { 60278 poly16x8_t __ret; 60279 __ret = (poly16x8_t)(__p0); 60280 return __ret; 60281 } 60282 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s64(int64x2_t __p0) { 60283 poly16x8_t __ret; 60284 __ret = (poly16x8_t)(__p0); 60285 return __ret; 60286 } 60287 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_mf8(mfloat8x16_t __p0) { 60288 poly16x8_t __ret; 60289 __ret = (poly16x8_t)(__p0); 60290 return __ret; 60291 } 60292 __ai __attribute__((target("neon"))) poly16x8_t vreinterpretq_p16_s16(int16x8_t __p0) { 60293 poly16x8_t __ret; 60294 __ret = (poly16x8_t)(__p0); 60295 return __ret; 60296 } 60297 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p8(poly8x16_t __p0) { 60298 uint8x16_t __ret; 60299 __ret = (uint8x16_t)(__p0); 60300 return __ret; 60301 } 60302 __ai __attribute__((target("neon"))) uint8x16_t 
vreinterpretq_u8_p128(poly128_t __p0) { 60303 uint8x16_t __ret; 60304 __ret = (uint8x16_t)(__p0); 60305 return __ret; 60306 } 60307 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p64(poly64x2_t __p0) { 60308 uint8x16_t __ret; 60309 __ret = (uint8x16_t)(__p0); 60310 return __ret; 60311 } 60312 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_p16(poly16x8_t __p0) { 60313 uint8x16_t __ret; 60314 __ret = (uint8x16_t)(__p0); 60315 return __ret; 60316 } 60317 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u32(uint32x4_t __p0) { 60318 uint8x16_t __ret; 60319 __ret = (uint8x16_t)(__p0); 60320 return __ret; 60321 } 60322 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u64(uint64x2_t __p0) { 60323 uint8x16_t __ret; 60324 __ret = (uint8x16_t)(__p0); 60325 return __ret; 60326 } 60327 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_u16(uint16x8_t __p0) { 60328 uint8x16_t __ret; 60329 __ret = (uint8x16_t)(__p0); 60330 return __ret; 60331 } 60332 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s8(int8x16_t __p0) { 60333 uint8x16_t __ret; 60334 __ret = (uint8x16_t)(__p0); 60335 return __ret; 60336 } 60337 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f64(float64x2_t __p0) { 60338 uint8x16_t __ret; 60339 __ret = (uint8x16_t)(__p0); 60340 return __ret; 60341 } 60342 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f32(float32x4_t __p0) { 60343 uint8x16_t __ret; 60344 __ret = (uint8x16_t)(__p0); 60345 return __ret; 60346 } 60347 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_f16(float16x8_t __p0) { 60348 uint8x16_t __ret; 60349 __ret = (uint8x16_t)(__p0); 60350 return __ret; 60351 } 60352 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s32(int32x4_t __p0) { 60353 uint8x16_t __ret; 60354 __ret = (uint8x16_t)(__p0); 60355 return __ret; 60356 } 60357 __ai __attribute__((target("neon"))) uint8x16_t 
vreinterpretq_u8_s64(int64x2_t __p0) { 60358 uint8x16_t __ret; 60359 __ret = (uint8x16_t)(__p0); 60360 return __ret; 60361 } 60362 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_mf8(mfloat8x16_t __p0) { 60363 uint8x16_t __ret; 60364 __ret = (uint8x16_t)(__p0); 60365 return __ret; 60366 } 60367 __ai __attribute__((target("neon"))) uint8x16_t vreinterpretq_u8_s16(int16x8_t __p0) { 60368 uint8x16_t __ret; 60369 __ret = (uint8x16_t)(__p0); 60370 return __ret; 60371 } 60372 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p8(poly8x16_t __p0) { 60373 uint32x4_t __ret; 60374 __ret = (uint32x4_t)(__p0); 60375 return __ret; 60376 } 60377 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p128(poly128_t __p0) { 60378 uint32x4_t __ret; 60379 __ret = (uint32x4_t)(__p0); 60380 return __ret; 60381 } 60382 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p64(poly64x2_t __p0) { 60383 uint32x4_t __ret; 60384 __ret = (uint32x4_t)(__p0); 60385 return __ret; 60386 } 60387 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_p16(poly16x8_t __p0) { 60388 uint32x4_t __ret; 60389 __ret = (uint32x4_t)(__p0); 60390 return __ret; 60391 } 60392 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u8(uint8x16_t __p0) { 60393 uint32x4_t __ret; 60394 __ret = (uint32x4_t)(__p0); 60395 return __ret; 60396 } 60397 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u64(uint64x2_t __p0) { 60398 uint32x4_t __ret; 60399 __ret = (uint32x4_t)(__p0); 60400 return __ret; 60401 } 60402 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_u16(uint16x8_t __p0) { 60403 uint32x4_t __ret; 60404 __ret = (uint32x4_t)(__p0); 60405 return __ret; 60406 } 60407 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s8(int8x16_t __p0) { 60408 uint32x4_t __ret; 60409 __ret = (uint32x4_t)(__p0); 60410 return __ret; 60411 } 60412 __ai __attribute__((target("neon"))) uint32x4_t 
vreinterpretq_u32_f64(float64x2_t __p0) { 60413 uint32x4_t __ret; 60414 __ret = (uint32x4_t)(__p0); 60415 return __ret; 60416 } 60417 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f32(float32x4_t __p0) { 60418 uint32x4_t __ret; 60419 __ret = (uint32x4_t)(__p0); 60420 return __ret; 60421 } 60422 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_f16(float16x8_t __p0) { 60423 uint32x4_t __ret; 60424 __ret = (uint32x4_t)(__p0); 60425 return __ret; 60426 } 60427 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s32(int32x4_t __p0) { 60428 uint32x4_t __ret; 60429 __ret = (uint32x4_t)(__p0); 60430 return __ret; 60431 } 60432 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s64(int64x2_t __p0) { 60433 uint32x4_t __ret; 60434 __ret = (uint32x4_t)(__p0); 60435 return __ret; 60436 } 60437 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_mf8(mfloat8x16_t __p0) { 60438 uint32x4_t __ret; 60439 __ret = (uint32x4_t)(__p0); 60440 return __ret; 60441 } 60442 __ai __attribute__((target("neon"))) uint32x4_t vreinterpretq_u32_s16(int16x8_t __p0) { 60443 uint32x4_t __ret; 60444 __ret = (uint32x4_t)(__p0); 60445 return __ret; 60446 } 60447 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p8(poly8x16_t __p0) { 60448 uint64x2_t __ret; 60449 __ret = (uint64x2_t)(__p0); 60450 return __ret; 60451 } 60452 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p128(poly128_t __p0) { 60453 uint64x2_t __ret; 60454 __ret = (uint64x2_t)(__p0); 60455 return __ret; 60456 } 60457 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p64(poly64x2_t __p0) { 60458 uint64x2_t __ret; 60459 __ret = (uint64x2_t)(__p0); 60460 return __ret; 60461 } 60462 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_p16(poly16x8_t __p0) { 60463 uint64x2_t __ret; 60464 __ret = (uint64x2_t)(__p0); 60465 return __ret; 60466 } 60467 __ai __attribute__((target("neon"))) uint64x2_t 
vreinterpretq_u64_u8(uint8x16_t __p0) { 60468 uint64x2_t __ret; 60469 __ret = (uint64x2_t)(__p0); 60470 return __ret; 60471 } 60472 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u32(uint32x4_t __p0) { 60473 uint64x2_t __ret; 60474 __ret = (uint64x2_t)(__p0); 60475 return __ret; 60476 } 60477 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_u16(uint16x8_t __p0) { 60478 uint64x2_t __ret; 60479 __ret = (uint64x2_t)(__p0); 60480 return __ret; 60481 } 60482 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s8(int8x16_t __p0) { 60483 uint64x2_t __ret; 60484 __ret = (uint64x2_t)(__p0); 60485 return __ret; 60486 } 60487 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f64(float64x2_t __p0) { 60488 uint64x2_t __ret; 60489 __ret = (uint64x2_t)(__p0); 60490 return __ret; 60491 } 60492 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f32(float32x4_t __p0) { 60493 uint64x2_t __ret; 60494 __ret = (uint64x2_t)(__p0); 60495 return __ret; 60496 } 60497 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_f16(float16x8_t __p0) { 60498 uint64x2_t __ret; 60499 __ret = (uint64x2_t)(__p0); 60500 return __ret; 60501 } 60502 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s32(int32x4_t __p0) { 60503 uint64x2_t __ret; 60504 __ret = (uint64x2_t)(__p0); 60505 return __ret; 60506 } 60507 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s64(int64x2_t __p0) { 60508 uint64x2_t __ret; 60509 __ret = (uint64x2_t)(__p0); 60510 return __ret; 60511 } 60512 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_mf8(mfloat8x16_t __p0) { 60513 uint64x2_t __ret; 60514 __ret = (uint64x2_t)(__p0); 60515 return __ret; 60516 } 60517 __ai __attribute__((target("neon"))) uint64x2_t vreinterpretq_u64_s16(int16x8_t __p0) { 60518 uint64x2_t __ret; 60519 __ret = (uint64x2_t)(__p0); 60520 return __ret; 60521 } 60522 __ai __attribute__((target("neon"))) uint16x8_t 
vreinterpretq_u16_p8(poly8x16_t __p0) { 60523 uint16x8_t __ret; 60524 __ret = (uint16x8_t)(__p0); 60525 return __ret; 60526 } 60527 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p128(poly128_t __p0) { 60528 uint16x8_t __ret; 60529 __ret = (uint16x8_t)(__p0); 60530 return __ret; 60531 } 60532 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p64(poly64x2_t __p0) { 60533 uint16x8_t __ret; 60534 __ret = (uint16x8_t)(__p0); 60535 return __ret; 60536 } 60537 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_p16(poly16x8_t __p0) { 60538 uint16x8_t __ret; 60539 __ret = (uint16x8_t)(__p0); 60540 return __ret; 60541 } 60542 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u8(uint8x16_t __p0) { 60543 uint16x8_t __ret; 60544 __ret = (uint16x8_t)(__p0); 60545 return __ret; 60546 } 60547 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u32(uint32x4_t __p0) { 60548 uint16x8_t __ret; 60549 __ret = (uint16x8_t)(__p0); 60550 return __ret; 60551 } 60552 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_u64(uint64x2_t __p0) { 60553 uint16x8_t __ret; 60554 __ret = (uint16x8_t)(__p0); 60555 return __ret; 60556 } 60557 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s8(int8x16_t __p0) { 60558 uint16x8_t __ret; 60559 __ret = (uint16x8_t)(__p0); 60560 return __ret; 60561 } 60562 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f64(float64x2_t __p0) { 60563 uint16x8_t __ret; 60564 __ret = (uint16x8_t)(__p0); 60565 return __ret; 60566 } 60567 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f32(float32x4_t __p0) { 60568 uint16x8_t __ret; 60569 __ret = (uint16x8_t)(__p0); 60570 return __ret; 60571 } 60572 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_f16(float16x8_t __p0) { 60573 uint16x8_t __ret; 60574 __ret = (uint16x8_t)(__p0); 60575 return __ret; 60576 } 60577 __ai __attribute__((target("neon"))) uint16x8_t 
vreinterpretq_u16_s32(int32x4_t __p0) { 60578 uint16x8_t __ret; 60579 __ret = (uint16x8_t)(__p0); 60580 return __ret; 60581 } 60582 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s64(int64x2_t __p0) { 60583 uint16x8_t __ret; 60584 __ret = (uint16x8_t)(__p0); 60585 return __ret; 60586 } 60587 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_mf8(mfloat8x16_t __p0) { 60588 uint16x8_t __ret; 60589 __ret = (uint16x8_t)(__p0); 60590 return __ret; 60591 } 60592 __ai __attribute__((target("neon"))) uint16x8_t vreinterpretq_u16_s16(int16x8_t __p0) { 60593 uint16x8_t __ret; 60594 __ret = (uint16x8_t)(__p0); 60595 return __ret; 60596 } 60597 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p8(poly8x16_t __p0) { 60598 int8x16_t __ret; 60599 __ret = (int8x16_t)(__p0); 60600 return __ret; 60601 } 60602 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p128(poly128_t __p0) { 60603 int8x16_t __ret; 60604 __ret = (int8x16_t)(__p0); 60605 return __ret; 60606 } 60607 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p64(poly64x2_t __p0) { 60608 int8x16_t __ret; 60609 __ret = (int8x16_t)(__p0); 60610 return __ret; 60611 } 60612 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_p16(poly16x8_t __p0) { 60613 int8x16_t __ret; 60614 __ret = (int8x16_t)(__p0); 60615 return __ret; 60616 } 60617 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u8(uint8x16_t __p0) { 60618 int8x16_t __ret; 60619 __ret = (int8x16_t)(__p0); 60620 return __ret; 60621 } 60622 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u32(uint32x4_t __p0) { 60623 int8x16_t __ret; 60624 __ret = (int8x16_t)(__p0); 60625 return __ret; 60626 } 60627 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u64(uint64x2_t __p0) { 60628 int8x16_t __ret; 60629 __ret = (int8x16_t)(__p0); 60630 return __ret; 60631 } 60632 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_u16(uint16x8_t __p0) { 
60633 int8x16_t __ret; 60634 __ret = (int8x16_t)(__p0); 60635 return __ret; 60636 } 60637 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f64(float64x2_t __p0) { 60638 int8x16_t __ret; 60639 __ret = (int8x16_t)(__p0); 60640 return __ret; 60641 } 60642 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f32(float32x4_t __p0) { 60643 int8x16_t __ret; 60644 __ret = (int8x16_t)(__p0); 60645 return __ret; 60646 } 60647 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_f16(float16x8_t __p0) { 60648 int8x16_t __ret; 60649 __ret = (int8x16_t)(__p0); 60650 return __ret; 60651 } 60652 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s32(int32x4_t __p0) { 60653 int8x16_t __ret; 60654 __ret = (int8x16_t)(__p0); 60655 return __ret; 60656 } 60657 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s64(int64x2_t __p0) { 60658 int8x16_t __ret; 60659 __ret = (int8x16_t)(__p0); 60660 return __ret; 60661 } 60662 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_mf8(mfloat8x16_t __p0) { 60663 int8x16_t __ret; 60664 __ret = (int8x16_t)(__p0); 60665 return __ret; 60666 } 60667 __ai __attribute__((target("neon"))) int8x16_t vreinterpretq_s8_s16(int16x8_t __p0) { 60668 int8x16_t __ret; 60669 __ret = (int8x16_t)(__p0); 60670 return __ret; 60671 } 60672 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_p8(poly8x16_t __p0) { 60673 float64x2_t __ret; 60674 __ret = (float64x2_t)(__p0); 60675 return __ret; 60676 } 60677 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_p128(poly128_t __p0) { 60678 float64x2_t __ret; 60679 __ret = (float64x2_t)(__p0); 60680 return __ret; 60681 } 60682 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_p64(poly64x2_t __p0) { 60683 float64x2_t __ret; 60684 __ret = (float64x2_t)(__p0); 60685 return __ret; 60686 } 60687 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_p16(poly16x8_t __p0) { 60688 float64x2_t __ret; 
60689 __ret = (float64x2_t)(__p0); 60690 return __ret; 60691 } 60692 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_u8(uint8x16_t __p0) { 60693 float64x2_t __ret; 60694 __ret = (float64x2_t)(__p0); 60695 return __ret; 60696 } 60697 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_u32(uint32x4_t __p0) { 60698 float64x2_t __ret; 60699 __ret = (float64x2_t)(__p0); 60700 return __ret; 60701 } 60702 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_u64(uint64x2_t __p0) { 60703 float64x2_t __ret; 60704 __ret = (float64x2_t)(__p0); 60705 return __ret; 60706 } 60707 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_u16(uint16x8_t __p0) { 60708 float64x2_t __ret; 60709 __ret = (float64x2_t)(__p0); 60710 return __ret; 60711 } 60712 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_s8(int8x16_t __p0) { 60713 float64x2_t __ret; 60714 __ret = (float64x2_t)(__p0); 60715 return __ret; 60716 } 60717 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_f32(float32x4_t __p0) { 60718 float64x2_t __ret; 60719 __ret = (float64x2_t)(__p0); 60720 return __ret; 60721 } 60722 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_f16(float16x8_t __p0) { 60723 float64x2_t __ret; 60724 __ret = (float64x2_t)(__p0); 60725 return __ret; 60726 } 60727 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_s32(int32x4_t __p0) { 60728 float64x2_t __ret; 60729 __ret = (float64x2_t)(__p0); 60730 return __ret; 60731 } 60732 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_s64(int64x2_t __p0) { 60733 float64x2_t __ret; 60734 __ret = (float64x2_t)(__p0); 60735 return __ret; 60736 } 60737 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_mf8(mfloat8x16_t __p0) { 60738 float64x2_t __ret; 60739 __ret = (float64x2_t)(__p0); 60740 return __ret; 60741 } 60742 __ai __attribute__((target("neon"))) float64x2_t vreinterpretq_f64_s16(int16x8_t __p0) { 
60743 float64x2_t __ret; 60744 __ret = (float64x2_t)(__p0); 60745 return __ret; 60746 } 60747 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p8(poly8x16_t __p0) { 60748 float32x4_t __ret; 60749 __ret = (float32x4_t)(__p0); 60750 return __ret; 60751 } 60752 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p128(poly128_t __p0) { 60753 float32x4_t __ret; 60754 __ret = (float32x4_t)(__p0); 60755 return __ret; 60756 } 60757 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p64(poly64x2_t __p0) { 60758 float32x4_t __ret; 60759 __ret = (float32x4_t)(__p0); 60760 return __ret; 60761 } 60762 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_p16(poly16x8_t __p0) { 60763 float32x4_t __ret; 60764 __ret = (float32x4_t)(__p0); 60765 return __ret; 60766 } 60767 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u8(uint8x16_t __p0) { 60768 float32x4_t __ret; 60769 __ret = (float32x4_t)(__p0); 60770 return __ret; 60771 } 60772 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u32(uint32x4_t __p0) { 60773 float32x4_t __ret; 60774 __ret = (float32x4_t)(__p0); 60775 return __ret; 60776 } 60777 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u64(uint64x2_t __p0) { 60778 float32x4_t __ret; 60779 __ret = (float32x4_t)(__p0); 60780 return __ret; 60781 } 60782 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_u16(uint16x8_t __p0) { 60783 float32x4_t __ret; 60784 __ret = (float32x4_t)(__p0); 60785 return __ret; 60786 } 60787 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s8(int8x16_t __p0) { 60788 float32x4_t __ret; 60789 __ret = (float32x4_t)(__p0); 60790 return __ret; 60791 } 60792 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_f64(float64x2_t __p0) { 60793 float32x4_t __ret; 60794 __ret = (float32x4_t)(__p0); 60795 return __ret; 60796 } 60797 __ai __attribute__((target("neon"))) float32x4_t 
vreinterpretq_f32_f16(float16x8_t __p0) { 60798 float32x4_t __ret; 60799 __ret = (float32x4_t)(__p0); 60800 return __ret; 60801 } 60802 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s32(int32x4_t __p0) { 60803 float32x4_t __ret; 60804 __ret = (float32x4_t)(__p0); 60805 return __ret; 60806 } 60807 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s64(int64x2_t __p0) { 60808 float32x4_t __ret; 60809 __ret = (float32x4_t)(__p0); 60810 return __ret; 60811 } 60812 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_mf8(mfloat8x16_t __p0) { 60813 float32x4_t __ret; 60814 __ret = (float32x4_t)(__p0); 60815 return __ret; 60816 } 60817 __ai __attribute__((target("neon"))) float32x4_t vreinterpretq_f32_s16(int16x8_t __p0) { 60818 float32x4_t __ret; 60819 __ret = (float32x4_t)(__p0); 60820 return __ret; 60821 } 60822 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p8(poly8x16_t __p0) { 60823 float16x8_t __ret; 60824 __ret = (float16x8_t)(__p0); 60825 return __ret; 60826 } 60827 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p128(poly128_t __p0) { 60828 float16x8_t __ret; 60829 __ret = (float16x8_t)(__p0); 60830 return __ret; 60831 } 60832 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p64(poly64x2_t __p0) { 60833 float16x8_t __ret; 60834 __ret = (float16x8_t)(__p0); 60835 return __ret; 60836 } 60837 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_p16(poly16x8_t __p0) { 60838 float16x8_t __ret; 60839 __ret = (float16x8_t)(__p0); 60840 return __ret; 60841 } 60842 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u8(uint8x16_t __p0) { 60843 float16x8_t __ret; 60844 __ret = (float16x8_t)(__p0); 60845 return __ret; 60846 } 60847 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u32(uint32x4_t __p0) { 60848 float16x8_t __ret; 60849 __ret = (float16x8_t)(__p0); 60850 return __ret; 60851 } 60852 __ai 
__attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u64(uint64x2_t __p0) { 60853 float16x8_t __ret; 60854 __ret = (float16x8_t)(__p0); 60855 return __ret; 60856 } 60857 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_u16(uint16x8_t __p0) { 60858 float16x8_t __ret; 60859 __ret = (float16x8_t)(__p0); 60860 return __ret; 60861 } 60862 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s8(int8x16_t __p0) { 60863 float16x8_t __ret; 60864 __ret = (float16x8_t)(__p0); 60865 return __ret; 60866 } 60867 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_f64(float64x2_t __p0) { 60868 float16x8_t __ret; 60869 __ret = (float16x8_t)(__p0); 60870 return __ret; 60871 } 60872 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_f32(float32x4_t __p0) { 60873 float16x8_t __ret; 60874 __ret = (float16x8_t)(__p0); 60875 return __ret; 60876 } 60877 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s32(int32x4_t __p0) { 60878 float16x8_t __ret; 60879 __ret = (float16x8_t)(__p0); 60880 return __ret; 60881 } 60882 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s64(int64x2_t __p0) { 60883 float16x8_t __ret; 60884 __ret = (float16x8_t)(__p0); 60885 return __ret; 60886 } 60887 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_mf8(mfloat8x16_t __p0) { 60888 float16x8_t __ret; 60889 __ret = (float16x8_t)(__p0); 60890 return __ret; 60891 } 60892 __ai __attribute__((target("neon"))) float16x8_t vreinterpretq_f16_s16(int16x8_t __p0) { 60893 float16x8_t __ret; 60894 __ret = (float16x8_t)(__p0); 60895 return __ret; 60896 } 60897 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p8(poly8x16_t __p0) { 60898 int32x4_t __ret; 60899 __ret = (int32x4_t)(__p0); 60900 return __ret; 60901 } 60902 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p128(poly128_t __p0) { 60903 int32x4_t __ret; 60904 __ret = (int32x4_t)(__p0); 60905 return __ret; 60906 } 
60907 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p64(poly64x2_t __p0) { 60908 int32x4_t __ret; 60909 __ret = (int32x4_t)(__p0); 60910 return __ret; 60911 } 60912 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_p16(poly16x8_t __p0) { 60913 int32x4_t __ret; 60914 __ret = (int32x4_t)(__p0); 60915 return __ret; 60916 } 60917 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u8(uint8x16_t __p0) { 60918 int32x4_t __ret; 60919 __ret = (int32x4_t)(__p0); 60920 return __ret; 60921 } 60922 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u32(uint32x4_t __p0) { 60923 int32x4_t __ret; 60924 __ret = (int32x4_t)(__p0); 60925 return __ret; 60926 } 60927 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u64(uint64x2_t __p0) { 60928 int32x4_t __ret; 60929 __ret = (int32x4_t)(__p0); 60930 return __ret; 60931 } 60932 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_u16(uint16x8_t __p0) { 60933 int32x4_t __ret; 60934 __ret = (int32x4_t)(__p0); 60935 return __ret; 60936 } 60937 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s8(int8x16_t __p0) { 60938 int32x4_t __ret; 60939 __ret = (int32x4_t)(__p0); 60940 return __ret; 60941 } 60942 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f64(float64x2_t __p0) { 60943 int32x4_t __ret; 60944 __ret = (int32x4_t)(__p0); 60945 return __ret; 60946 } 60947 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f32(float32x4_t __p0) { 60948 int32x4_t __ret; 60949 __ret = (int32x4_t)(__p0); 60950 return __ret; 60951 } 60952 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_f16(float16x8_t __p0) { 60953 int32x4_t __ret; 60954 __ret = (int32x4_t)(__p0); 60955 return __ret; 60956 } 60957 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s64(int64x2_t __p0) { 60958 int32x4_t __ret; 60959 __ret = (int32x4_t)(__p0); 60960 return __ret; 60961 } 60962 __ai __attribute__((target("neon"))) 
int32x4_t vreinterpretq_s32_mf8(mfloat8x16_t __p0) { 60963 int32x4_t __ret; 60964 __ret = (int32x4_t)(__p0); 60965 return __ret; 60966 } 60967 __ai __attribute__((target("neon"))) int32x4_t vreinterpretq_s32_s16(int16x8_t __p0) { 60968 int32x4_t __ret; 60969 __ret = (int32x4_t)(__p0); 60970 return __ret; 60971 } 60972 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p8(poly8x16_t __p0) { 60973 int64x2_t __ret; 60974 __ret = (int64x2_t)(__p0); 60975 return __ret; 60976 } 60977 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p128(poly128_t __p0) { 60978 int64x2_t __ret; 60979 __ret = (int64x2_t)(__p0); 60980 return __ret; 60981 } 60982 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p64(poly64x2_t __p0) { 60983 int64x2_t __ret; 60984 __ret = (int64x2_t)(__p0); 60985 return __ret; 60986 } 60987 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_p16(poly16x8_t __p0) { 60988 int64x2_t __ret; 60989 __ret = (int64x2_t)(__p0); 60990 return __ret; 60991 } 60992 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u8(uint8x16_t __p0) { 60993 int64x2_t __ret; 60994 __ret = (int64x2_t)(__p0); 60995 return __ret; 60996 } 60997 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u32(uint32x4_t __p0) { 60998 int64x2_t __ret; 60999 __ret = (int64x2_t)(__p0); 61000 return __ret; 61001 } 61002 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u64(uint64x2_t __p0) { 61003 int64x2_t __ret; 61004 __ret = (int64x2_t)(__p0); 61005 return __ret; 61006 } 61007 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_u16(uint16x8_t __p0) { 61008 int64x2_t __ret; 61009 __ret = (int64x2_t)(__p0); 61010 return __ret; 61011 } 61012 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s8(int8x16_t __p0) { 61013 int64x2_t __ret; 61014 __ret = (int64x2_t)(__p0); 61015 return __ret; 61016 } 61017 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f64(float64x2_t 
__p0) { 61018 int64x2_t __ret; 61019 __ret = (int64x2_t)(__p0); 61020 return __ret; 61021 } 61022 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f32(float32x4_t __p0) { 61023 int64x2_t __ret; 61024 __ret = (int64x2_t)(__p0); 61025 return __ret; 61026 } 61027 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_f16(float16x8_t __p0) { 61028 int64x2_t __ret; 61029 __ret = (int64x2_t)(__p0); 61030 return __ret; 61031 } 61032 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s32(int32x4_t __p0) { 61033 int64x2_t __ret; 61034 __ret = (int64x2_t)(__p0); 61035 return __ret; 61036 } 61037 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_mf8(mfloat8x16_t __p0) { 61038 int64x2_t __ret; 61039 __ret = (int64x2_t)(__p0); 61040 return __ret; 61041 } 61042 __ai __attribute__((target("neon"))) int64x2_t vreinterpretq_s64_s16(int16x8_t __p0) { 61043 int64x2_t __ret; 61044 __ret = (int64x2_t)(__p0); 61045 return __ret; 61046 } 61047 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_p8(poly8x16_t __p0) { 61048 mfloat8x16_t __ret; 61049 __ret = (mfloat8x16_t)(__p0); 61050 return __ret; 61051 } 61052 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_p128(poly128_t __p0) { 61053 mfloat8x16_t __ret; 61054 __ret = (mfloat8x16_t)(__p0); 61055 return __ret; 61056 } 61057 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_p64(poly64x2_t __p0) { 61058 mfloat8x16_t __ret; 61059 __ret = (mfloat8x16_t)(__p0); 61060 return __ret; 61061 } 61062 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_p16(poly16x8_t __p0) { 61063 mfloat8x16_t __ret; 61064 __ret = (mfloat8x16_t)(__p0); 61065 return __ret; 61066 } 61067 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_u8(uint8x16_t __p0) { 61068 mfloat8x16_t __ret; 61069 __ret = (mfloat8x16_t)(__p0); 61070 return __ret; 61071 } 61072 __ai __attribute__((target("neon"))) mfloat8x16_t 
vreinterpretq_mf8_u32(uint32x4_t __p0) { 61073 mfloat8x16_t __ret; 61074 __ret = (mfloat8x16_t)(__p0); 61075 return __ret; 61076 } 61077 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_u64(uint64x2_t __p0) { 61078 mfloat8x16_t __ret; 61079 __ret = (mfloat8x16_t)(__p0); 61080 return __ret; 61081 } 61082 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_u16(uint16x8_t __p0) { 61083 mfloat8x16_t __ret; 61084 __ret = (mfloat8x16_t)(__p0); 61085 return __ret; 61086 } 61087 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_s8(int8x16_t __p0) { 61088 mfloat8x16_t __ret; 61089 __ret = (mfloat8x16_t)(__p0); 61090 return __ret; 61091 } 61092 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_f64(float64x2_t __p0) { 61093 mfloat8x16_t __ret; 61094 __ret = (mfloat8x16_t)(__p0); 61095 return __ret; 61096 } 61097 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_f32(float32x4_t __p0) { 61098 mfloat8x16_t __ret; 61099 __ret = (mfloat8x16_t)(__p0); 61100 return __ret; 61101 } 61102 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_f16(float16x8_t __p0) { 61103 mfloat8x16_t __ret; 61104 __ret = (mfloat8x16_t)(__p0); 61105 return __ret; 61106 } 61107 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_s32(int32x4_t __p0) { 61108 mfloat8x16_t __ret; 61109 __ret = (mfloat8x16_t)(__p0); 61110 return __ret; 61111 } 61112 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_s64(int64x2_t __p0) { 61113 mfloat8x16_t __ret; 61114 __ret = (mfloat8x16_t)(__p0); 61115 return __ret; 61116 } 61117 __ai __attribute__((target("neon"))) mfloat8x16_t vreinterpretq_mf8_s16(int16x8_t __p0) { 61118 mfloat8x16_t __ret; 61119 __ret = (mfloat8x16_t)(__p0); 61120 return __ret; 61121 } 61122 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p8(poly8x16_t __p0) { 61123 int16x8_t __ret; 61124 __ret = (int16x8_t)(__p0); 61125 return __ret; 61126 } 61127 __ai 
__attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p128(poly128_t __p0) { 61128 int16x8_t __ret; 61129 __ret = (int16x8_t)(__p0); 61130 return __ret; 61131 } 61132 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p64(poly64x2_t __p0) { 61133 int16x8_t __ret; 61134 __ret = (int16x8_t)(__p0); 61135 return __ret; 61136 } 61137 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_p16(poly16x8_t __p0) { 61138 int16x8_t __ret; 61139 __ret = (int16x8_t)(__p0); 61140 return __ret; 61141 } 61142 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u8(uint8x16_t __p0) { 61143 int16x8_t __ret; 61144 __ret = (int16x8_t)(__p0); 61145 return __ret; 61146 } 61147 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u32(uint32x4_t __p0) { 61148 int16x8_t __ret; 61149 __ret = (int16x8_t)(__p0); 61150 return __ret; 61151 } 61152 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u64(uint64x2_t __p0) { 61153 int16x8_t __ret; 61154 __ret = (int16x8_t)(__p0); 61155 return __ret; 61156 } 61157 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_u16(uint16x8_t __p0) { 61158 int16x8_t __ret; 61159 __ret = (int16x8_t)(__p0); 61160 return __ret; 61161 } 61162 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s8(int8x16_t __p0) { 61163 int16x8_t __ret; 61164 __ret = (int16x8_t)(__p0); 61165 return __ret; 61166 } 61167 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f64(float64x2_t __p0) { 61168 int16x8_t __ret; 61169 __ret = (int16x8_t)(__p0); 61170 return __ret; 61171 } 61172 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f32(float32x4_t __p0) { 61173 int16x8_t __ret; 61174 __ret = (int16x8_t)(__p0); 61175 return __ret; 61176 } 61177 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_f16(float16x8_t __p0) { 61178 int16x8_t __ret; 61179 __ret = (int16x8_t)(__p0); 61180 return __ret; 61181 } 61182 __ai __attribute__((target("neon"))) int16x8_t 
vreinterpretq_s16_s32(int32x4_t __p0) { 61183 int16x8_t __ret; 61184 __ret = (int16x8_t)(__p0); 61185 return __ret; 61186 } 61187 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_s64(int64x2_t __p0) { 61188 int16x8_t __ret; 61189 __ret = (int16x8_t)(__p0); 61190 return __ret; 61191 } 61192 __ai __attribute__((target("neon"))) int16x8_t vreinterpretq_s16_mf8(mfloat8x16_t __p0) { 61193 int16x8_t __ret; 61194 __ret = (int16x8_t)(__p0); 61195 return __ret; 61196 } 61197 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p8(poly8x8_t __p0) { 61198 uint8x8_t __ret; 61199 __ret = (uint8x8_t)(__p0); 61200 return __ret; 61201 } 61202 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p64(poly64x1_t __p0) { 61203 uint8x8_t __ret; 61204 __ret = (uint8x8_t)(__p0); 61205 return __ret; 61206 } 61207 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_p16(poly16x4_t __p0) { 61208 uint8x8_t __ret; 61209 __ret = (uint8x8_t)(__p0); 61210 return __ret; 61211 } 61212 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u32(uint32x2_t __p0) { 61213 uint8x8_t __ret; 61214 __ret = (uint8x8_t)(__p0); 61215 return __ret; 61216 } 61217 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u64(uint64x1_t __p0) { 61218 uint8x8_t __ret; 61219 __ret = (uint8x8_t)(__p0); 61220 return __ret; 61221 } 61222 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_u16(uint16x4_t __p0) { 61223 uint8x8_t __ret; 61224 __ret = (uint8x8_t)(__p0); 61225 return __ret; 61226 } 61227 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s8(int8x8_t __p0) { 61228 uint8x8_t __ret; 61229 __ret = (uint8x8_t)(__p0); 61230 return __ret; 61231 } 61232 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f64(float64x1_t __p0) { 61233 uint8x8_t __ret; 61234 __ret = (uint8x8_t)(__p0); 61235 return __ret; 61236 } 61237 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f32(float32x2_t __p0) { 61238 uint8x8_t 
__ret; 61239 __ret = (uint8x8_t)(__p0); 61240 return __ret; 61241 } 61242 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_f16(float16x4_t __p0) { 61243 uint8x8_t __ret; 61244 __ret = (uint8x8_t)(__p0); 61245 return __ret; 61246 } 61247 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s32(int32x2_t __p0) { 61248 uint8x8_t __ret; 61249 __ret = (uint8x8_t)(__p0); 61250 return __ret; 61251 } 61252 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s64(int64x1_t __p0) { 61253 uint8x8_t __ret; 61254 __ret = (uint8x8_t)(__p0); 61255 return __ret; 61256 } 61257 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_mf8(mfloat8x8_t __p0) { 61258 uint8x8_t __ret; 61259 __ret = (uint8x8_t)(__p0); 61260 return __ret; 61261 } 61262 __ai __attribute__((target("neon"))) uint8x8_t vreinterpret_u8_s16(int16x4_t __p0) { 61263 uint8x8_t __ret; 61264 __ret = (uint8x8_t)(__p0); 61265 return __ret; 61266 } 61267 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p8(poly8x8_t __p0) { 61268 uint32x2_t __ret; 61269 __ret = (uint32x2_t)(__p0); 61270 return __ret; 61271 } 61272 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p64(poly64x1_t __p0) { 61273 uint32x2_t __ret; 61274 __ret = (uint32x2_t)(__p0); 61275 return __ret; 61276 } 61277 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_p16(poly16x4_t __p0) { 61278 uint32x2_t __ret; 61279 __ret = (uint32x2_t)(__p0); 61280 return __ret; 61281 } 61282 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u8(uint8x8_t __p0) { 61283 uint32x2_t __ret; 61284 __ret = (uint32x2_t)(__p0); 61285 return __ret; 61286 } 61287 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u64(uint64x1_t __p0) { 61288 uint32x2_t __ret; 61289 __ret = (uint32x2_t)(__p0); 61290 return __ret; 61291 } 61292 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_u16(uint16x4_t __p0) { 61293 uint32x2_t __ret; 61294 __ret = (uint32x2_t)(__p0); 
61295 return __ret; 61296 } 61297 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s8(int8x8_t __p0) { 61298 uint32x2_t __ret; 61299 __ret = (uint32x2_t)(__p0); 61300 return __ret; 61301 } 61302 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f64(float64x1_t __p0) { 61303 uint32x2_t __ret; 61304 __ret = (uint32x2_t)(__p0); 61305 return __ret; 61306 } 61307 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f32(float32x2_t __p0) { 61308 uint32x2_t __ret; 61309 __ret = (uint32x2_t)(__p0); 61310 return __ret; 61311 } 61312 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_f16(float16x4_t __p0) { 61313 uint32x2_t __ret; 61314 __ret = (uint32x2_t)(__p0); 61315 return __ret; 61316 } 61317 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s32(int32x2_t __p0) { 61318 uint32x2_t __ret; 61319 __ret = (uint32x2_t)(__p0); 61320 return __ret; 61321 } 61322 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s64(int64x1_t __p0) { 61323 uint32x2_t __ret; 61324 __ret = (uint32x2_t)(__p0); 61325 return __ret; 61326 } 61327 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_mf8(mfloat8x8_t __p0) { 61328 uint32x2_t __ret; 61329 __ret = (uint32x2_t)(__p0); 61330 return __ret; 61331 } 61332 __ai __attribute__((target("neon"))) uint32x2_t vreinterpret_u32_s16(int16x4_t __p0) { 61333 uint32x2_t __ret; 61334 __ret = (uint32x2_t)(__p0); 61335 return __ret; 61336 } 61337 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p8(poly8x8_t __p0) { 61338 uint64x1_t __ret; 61339 __ret = (uint64x1_t)(__p0); 61340 return __ret; 61341 } 61342 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p64(poly64x1_t __p0) { 61343 uint64x1_t __ret; 61344 __ret = (uint64x1_t)(__p0); 61345 return __ret; 61346 } 61347 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_p16(poly16x4_t __p0) { 61348 uint64x1_t __ret; 61349 __ret = (uint64x1_t)(__p0); 61350 return __ret; 
61351 } 61352 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u8(uint8x8_t __p0) { 61353 uint64x1_t __ret; 61354 __ret = (uint64x1_t)(__p0); 61355 return __ret; 61356 } 61357 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u32(uint32x2_t __p0) { 61358 uint64x1_t __ret; 61359 __ret = (uint64x1_t)(__p0); 61360 return __ret; 61361 } 61362 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_u16(uint16x4_t __p0) { 61363 uint64x1_t __ret; 61364 __ret = (uint64x1_t)(__p0); 61365 return __ret; 61366 } 61367 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s8(int8x8_t __p0) { 61368 uint64x1_t __ret; 61369 __ret = (uint64x1_t)(__p0); 61370 return __ret; 61371 } 61372 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f64(float64x1_t __p0) { 61373 uint64x1_t __ret; 61374 __ret = (uint64x1_t)(__p0); 61375 return __ret; 61376 } 61377 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f32(float32x2_t __p0) { 61378 uint64x1_t __ret; 61379 __ret = (uint64x1_t)(__p0); 61380 return __ret; 61381 } 61382 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_f16(float16x4_t __p0) { 61383 uint64x1_t __ret; 61384 __ret = (uint64x1_t)(__p0); 61385 return __ret; 61386 } 61387 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s32(int32x2_t __p0) { 61388 uint64x1_t __ret; 61389 __ret = (uint64x1_t)(__p0); 61390 return __ret; 61391 } 61392 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s64(int64x1_t __p0) { 61393 uint64x1_t __ret; 61394 __ret = (uint64x1_t)(__p0); 61395 return __ret; 61396 } 61397 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_mf8(mfloat8x8_t __p0) { 61398 uint64x1_t __ret; 61399 __ret = (uint64x1_t)(__p0); 61400 return __ret; 61401 } 61402 __ai __attribute__((target("neon"))) uint64x1_t vreinterpret_u64_s16(int16x4_t __p0) { 61403 uint64x1_t __ret; 61404 __ret = (uint64x1_t)(__p0); 61405 return __ret; 61406 } 61407 __ai 
__attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p8(poly8x8_t __p0) { 61408 uint16x4_t __ret; 61409 __ret = (uint16x4_t)(__p0); 61410 return __ret; 61411 } 61412 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p64(poly64x1_t __p0) { 61413 uint16x4_t __ret; 61414 __ret = (uint16x4_t)(__p0); 61415 return __ret; 61416 } 61417 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_p16(poly16x4_t __p0) { 61418 uint16x4_t __ret; 61419 __ret = (uint16x4_t)(__p0); 61420 return __ret; 61421 } 61422 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u8(uint8x8_t __p0) { 61423 uint16x4_t __ret; 61424 __ret = (uint16x4_t)(__p0); 61425 return __ret; 61426 } 61427 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u32(uint32x2_t __p0) { 61428 uint16x4_t __ret; 61429 __ret = (uint16x4_t)(__p0); 61430 return __ret; 61431 } 61432 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_u64(uint64x1_t __p0) { 61433 uint16x4_t __ret; 61434 __ret = (uint16x4_t)(__p0); 61435 return __ret; 61436 } 61437 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s8(int8x8_t __p0) { 61438 uint16x4_t __ret; 61439 __ret = (uint16x4_t)(__p0); 61440 return __ret; 61441 } 61442 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f64(float64x1_t __p0) { 61443 uint16x4_t __ret; 61444 __ret = (uint16x4_t)(__p0); 61445 return __ret; 61446 } 61447 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f32(float32x2_t __p0) { 61448 uint16x4_t __ret; 61449 __ret = (uint16x4_t)(__p0); 61450 return __ret; 61451 } 61452 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_f16(float16x4_t __p0) { 61453 uint16x4_t __ret; 61454 __ret = (uint16x4_t)(__p0); 61455 return __ret; 61456 } 61457 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s32(int32x2_t __p0) { 61458 uint16x4_t __ret; 61459 __ret = (uint16x4_t)(__p0); 61460 return __ret; 61461 } 61462 __ai 
__attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s64(int64x1_t __p0) { 61463 uint16x4_t __ret; 61464 __ret = (uint16x4_t)(__p0); 61465 return __ret; 61466 } 61467 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_mf8(mfloat8x8_t __p0) { 61468 uint16x4_t __ret; 61469 __ret = (uint16x4_t)(__p0); 61470 return __ret; 61471 } 61472 __ai __attribute__((target("neon"))) uint16x4_t vreinterpret_u16_s16(int16x4_t __p0) { 61473 uint16x4_t __ret; 61474 __ret = (uint16x4_t)(__p0); 61475 return __ret; 61476 } 61477 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p8(poly8x8_t __p0) { 61478 int8x8_t __ret; 61479 __ret = (int8x8_t)(__p0); 61480 return __ret; 61481 } 61482 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p64(poly64x1_t __p0) { 61483 int8x8_t __ret; 61484 __ret = (int8x8_t)(__p0); 61485 return __ret; 61486 } 61487 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_p16(poly16x4_t __p0) { 61488 int8x8_t __ret; 61489 __ret = (int8x8_t)(__p0); 61490 return __ret; 61491 } 61492 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u8(uint8x8_t __p0) { 61493 int8x8_t __ret; 61494 __ret = (int8x8_t)(__p0); 61495 return __ret; 61496 } 61497 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u32(uint32x2_t __p0) { 61498 int8x8_t __ret; 61499 __ret = (int8x8_t)(__p0); 61500 return __ret; 61501 } 61502 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u64(uint64x1_t __p0) { 61503 int8x8_t __ret; 61504 __ret = (int8x8_t)(__p0); 61505 return __ret; 61506 } 61507 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_u16(uint16x4_t __p0) { 61508 int8x8_t __ret; 61509 __ret = (int8x8_t)(__p0); 61510 return __ret; 61511 } 61512 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f64(float64x1_t __p0) { 61513 int8x8_t __ret; 61514 __ret = (int8x8_t)(__p0); 61515 return __ret; 61516 } 61517 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f32(float32x2_t __p0) 
{ 61518 int8x8_t __ret; 61519 __ret = (int8x8_t)(__p0); 61520 return __ret; 61521 } 61522 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_f16(float16x4_t __p0) { 61523 int8x8_t __ret; 61524 __ret = (int8x8_t)(__p0); 61525 return __ret; 61526 } 61527 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s32(int32x2_t __p0) { 61528 int8x8_t __ret; 61529 __ret = (int8x8_t)(__p0); 61530 return __ret; 61531 } 61532 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s64(int64x1_t __p0) { 61533 int8x8_t __ret; 61534 __ret = (int8x8_t)(__p0); 61535 return __ret; 61536 } 61537 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_mf8(mfloat8x8_t __p0) { 61538 int8x8_t __ret; 61539 __ret = (int8x8_t)(__p0); 61540 return __ret; 61541 } 61542 __ai __attribute__((target("neon"))) int8x8_t vreinterpret_s8_s16(int16x4_t __p0) { 61543 int8x8_t __ret; 61544 __ret = (int8x8_t)(__p0); 61545 return __ret; 61546 } 61547 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_p8(poly8x8_t __p0) { 61548 float64x1_t __ret; 61549 __ret = (float64x1_t)(__p0); 61550 return __ret; 61551 } 61552 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_p64(poly64x1_t __p0) { 61553 float64x1_t __ret; 61554 __ret = (float64x1_t)(__p0); 61555 return __ret; 61556 } 61557 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_p16(poly16x4_t __p0) { 61558 float64x1_t __ret; 61559 __ret = (float64x1_t)(__p0); 61560 return __ret; 61561 } 61562 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_u8(uint8x8_t __p0) { 61563 float64x1_t __ret; 61564 __ret = (float64x1_t)(__p0); 61565 return __ret; 61566 } 61567 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_u32(uint32x2_t __p0) { 61568 float64x1_t __ret; 61569 __ret = (float64x1_t)(__p0); 61570 return __ret; 61571 } 61572 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_u64(uint64x1_t __p0) { 61573 float64x1_t __ret; 61574 __ret = 
(float64x1_t)(__p0); 61575 return __ret; 61576 } 61577 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_u16(uint16x4_t __p0) { 61578 float64x1_t __ret; 61579 __ret = (float64x1_t)(__p0); 61580 return __ret; 61581 } 61582 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_s8(int8x8_t __p0) { 61583 float64x1_t __ret; 61584 __ret = (float64x1_t)(__p0); 61585 return __ret; 61586 } 61587 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_f32(float32x2_t __p0) { 61588 float64x1_t __ret; 61589 __ret = (float64x1_t)(__p0); 61590 return __ret; 61591 } 61592 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_f16(float16x4_t __p0) { 61593 float64x1_t __ret; 61594 __ret = (float64x1_t)(__p0); 61595 return __ret; 61596 } 61597 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_s32(int32x2_t __p0) { 61598 float64x1_t __ret; 61599 __ret = (float64x1_t)(__p0); 61600 return __ret; 61601 } 61602 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_s64(int64x1_t __p0) { 61603 float64x1_t __ret; 61604 __ret = (float64x1_t)(__p0); 61605 return __ret; 61606 } 61607 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_mf8(mfloat8x8_t __p0) { 61608 float64x1_t __ret; 61609 __ret = (float64x1_t)(__p0); 61610 return __ret; 61611 } 61612 __ai __attribute__((target("neon"))) float64x1_t vreinterpret_f64_s16(int16x4_t __p0) { 61613 float64x1_t __ret; 61614 __ret = (float64x1_t)(__p0); 61615 return __ret; 61616 } 61617 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p8(poly8x8_t __p0) { 61618 float32x2_t __ret; 61619 __ret = (float32x2_t)(__p0); 61620 return __ret; 61621 } 61622 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p64(poly64x1_t __p0) { 61623 float32x2_t __ret; 61624 __ret = (float32x2_t)(__p0); 61625 return __ret; 61626 } 61627 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_p16(poly16x4_t __p0) { 61628 float32x2_t __ret; 61629 
__ret = (float32x2_t)(__p0); 61630 return __ret; 61631 } 61632 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u8(uint8x8_t __p0) { 61633 float32x2_t __ret; 61634 __ret = (float32x2_t)(__p0); 61635 return __ret; 61636 } 61637 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u32(uint32x2_t __p0) { 61638 float32x2_t __ret; 61639 __ret = (float32x2_t)(__p0); 61640 return __ret; 61641 } 61642 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u64(uint64x1_t __p0) { 61643 float32x2_t __ret; 61644 __ret = (float32x2_t)(__p0); 61645 return __ret; 61646 } 61647 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_u16(uint16x4_t __p0) { 61648 float32x2_t __ret; 61649 __ret = (float32x2_t)(__p0); 61650 return __ret; 61651 } 61652 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s8(int8x8_t __p0) { 61653 float32x2_t __ret; 61654 __ret = (float32x2_t)(__p0); 61655 return __ret; 61656 } 61657 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_f64(float64x1_t __p0) { 61658 float32x2_t __ret; 61659 __ret = (float32x2_t)(__p0); 61660 return __ret; 61661 } 61662 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_f16(float16x4_t __p0) { 61663 float32x2_t __ret; 61664 __ret = (float32x2_t)(__p0); 61665 return __ret; 61666 } 61667 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s32(int32x2_t __p0) { 61668 float32x2_t __ret; 61669 __ret = (float32x2_t)(__p0); 61670 return __ret; 61671 } 61672 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s64(int64x1_t __p0) { 61673 float32x2_t __ret; 61674 __ret = (float32x2_t)(__p0); 61675 return __ret; 61676 } 61677 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_mf8(mfloat8x8_t __p0) { 61678 float32x2_t __ret; 61679 __ret = (float32x2_t)(__p0); 61680 return __ret; 61681 } 61682 __ai __attribute__((target("neon"))) float32x2_t vreinterpret_f32_s16(int16x4_t __p0) { 61683 float32x2_t 
__ret; 61684 __ret = (float32x2_t)(__p0); 61685 return __ret; 61686 } 61687 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p8(poly8x8_t __p0) { 61688 float16x4_t __ret; 61689 __ret = (float16x4_t)(__p0); 61690 return __ret; 61691 } 61692 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p64(poly64x1_t __p0) { 61693 float16x4_t __ret; 61694 __ret = (float16x4_t)(__p0); 61695 return __ret; 61696 } 61697 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_p16(poly16x4_t __p0) { 61698 float16x4_t __ret; 61699 __ret = (float16x4_t)(__p0); 61700 return __ret; 61701 } 61702 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u8(uint8x8_t __p0) { 61703 float16x4_t __ret; 61704 __ret = (float16x4_t)(__p0); 61705 return __ret; 61706 } 61707 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u32(uint32x2_t __p0) { 61708 float16x4_t __ret; 61709 __ret = (float16x4_t)(__p0); 61710 return __ret; 61711 } 61712 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u64(uint64x1_t __p0) { 61713 float16x4_t __ret; 61714 __ret = (float16x4_t)(__p0); 61715 return __ret; 61716 } 61717 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_u16(uint16x4_t __p0) { 61718 float16x4_t __ret; 61719 __ret = (float16x4_t)(__p0); 61720 return __ret; 61721 } 61722 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s8(int8x8_t __p0) { 61723 float16x4_t __ret; 61724 __ret = (float16x4_t)(__p0); 61725 return __ret; 61726 } 61727 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_f64(float64x1_t __p0) { 61728 float16x4_t __ret; 61729 __ret = (float16x4_t)(__p0); 61730 return __ret; 61731 } 61732 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_f32(float32x2_t __p0) { 61733 float16x4_t __ret; 61734 __ret = (float16x4_t)(__p0); 61735 return __ret; 61736 } 61737 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s32(int32x2_t __p0) { 61738 
float16x4_t __ret; 61739 __ret = (float16x4_t)(__p0); 61740 return __ret; 61741 } 61742 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s64(int64x1_t __p0) { 61743 float16x4_t __ret; 61744 __ret = (float16x4_t)(__p0); 61745 return __ret; 61746 } 61747 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_mf8(mfloat8x8_t __p0) { 61748 float16x4_t __ret; 61749 __ret = (float16x4_t)(__p0); 61750 return __ret; 61751 } 61752 __ai __attribute__((target("neon"))) float16x4_t vreinterpret_f16_s16(int16x4_t __p0) { 61753 float16x4_t __ret; 61754 __ret = (float16x4_t)(__p0); 61755 return __ret; 61756 } 61757 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p8(poly8x8_t __p0) { 61758 int32x2_t __ret; 61759 __ret = (int32x2_t)(__p0); 61760 return __ret; 61761 } 61762 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p64(poly64x1_t __p0) { 61763 int32x2_t __ret; 61764 __ret = (int32x2_t)(__p0); 61765 return __ret; 61766 } 61767 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_p16(poly16x4_t __p0) { 61768 int32x2_t __ret; 61769 __ret = (int32x2_t)(__p0); 61770 return __ret; 61771 } 61772 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u8(uint8x8_t __p0) { 61773 int32x2_t __ret; 61774 __ret = (int32x2_t)(__p0); 61775 return __ret; 61776 } 61777 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u32(uint32x2_t __p0) { 61778 int32x2_t __ret; 61779 __ret = (int32x2_t)(__p0); 61780 return __ret; 61781 } 61782 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u64(uint64x1_t __p0) { 61783 int32x2_t __ret; 61784 __ret = (int32x2_t)(__p0); 61785 return __ret; 61786 } 61787 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_u16(uint16x4_t __p0) { 61788 int32x2_t __ret; 61789 __ret = (int32x2_t)(__p0); 61790 return __ret; 61791 } 61792 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s8(int8x8_t __p0) { 61793 int32x2_t __ret; 61794 __ret = 
(int32x2_t)(__p0); 61795 return __ret; 61796 } 61797 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f64(float64x1_t __p0) { 61798 int32x2_t __ret; 61799 __ret = (int32x2_t)(__p0); 61800 return __ret; 61801 } 61802 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f32(float32x2_t __p0) { 61803 int32x2_t __ret; 61804 __ret = (int32x2_t)(__p0); 61805 return __ret; 61806 } 61807 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_f16(float16x4_t __p0) { 61808 int32x2_t __ret; 61809 __ret = (int32x2_t)(__p0); 61810 return __ret; 61811 } 61812 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s64(int64x1_t __p0) { 61813 int32x2_t __ret; 61814 __ret = (int32x2_t)(__p0); 61815 return __ret; 61816 } 61817 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_mf8(mfloat8x8_t __p0) { 61818 int32x2_t __ret; 61819 __ret = (int32x2_t)(__p0); 61820 return __ret; 61821 } 61822 __ai __attribute__((target("neon"))) int32x2_t vreinterpret_s32_s16(int16x4_t __p0) { 61823 int32x2_t __ret; 61824 __ret = (int32x2_t)(__p0); 61825 return __ret; 61826 } 61827 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p8(poly8x8_t __p0) { 61828 int64x1_t __ret; 61829 __ret = (int64x1_t)(__p0); 61830 return __ret; 61831 } 61832 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p64(poly64x1_t __p0) { 61833 int64x1_t __ret; 61834 __ret = (int64x1_t)(__p0); 61835 return __ret; 61836 } 61837 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_p16(poly16x4_t __p0) { 61838 int64x1_t __ret; 61839 __ret = (int64x1_t)(__p0); 61840 return __ret; 61841 } 61842 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u8(uint8x8_t __p0) { 61843 int64x1_t __ret; 61844 __ret = (int64x1_t)(__p0); 61845 return __ret; 61846 } 61847 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u32(uint32x2_t __p0) { 61848 int64x1_t __ret; 61849 __ret = (int64x1_t)(__p0); 61850 return __ret; 61851 } 61852 
__ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u64(uint64x1_t __p0) { 61853 int64x1_t __ret; 61854 __ret = (int64x1_t)(__p0); 61855 return __ret; 61856 } 61857 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_u16(uint16x4_t __p0) { 61858 int64x1_t __ret; 61859 __ret = (int64x1_t)(__p0); 61860 return __ret; 61861 } 61862 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s8(int8x8_t __p0) { 61863 int64x1_t __ret; 61864 __ret = (int64x1_t)(__p0); 61865 return __ret; 61866 } 61867 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f64(float64x1_t __p0) { 61868 int64x1_t __ret; 61869 __ret = (int64x1_t)(__p0); 61870 return __ret; 61871 } 61872 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f32(float32x2_t __p0) { 61873 int64x1_t __ret; 61874 __ret = (int64x1_t)(__p0); 61875 return __ret; 61876 } 61877 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_f16(float16x4_t __p0) { 61878 int64x1_t __ret; 61879 __ret = (int64x1_t)(__p0); 61880 return __ret; 61881 } 61882 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s32(int32x2_t __p0) { 61883 int64x1_t __ret; 61884 __ret = (int64x1_t)(__p0); 61885 return __ret; 61886 } 61887 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_mf8(mfloat8x8_t __p0) { 61888 int64x1_t __ret; 61889 __ret = (int64x1_t)(__p0); 61890 return __ret; 61891 } 61892 __ai __attribute__((target("neon"))) int64x1_t vreinterpret_s64_s16(int16x4_t __p0) { 61893 int64x1_t __ret; 61894 __ret = (int64x1_t)(__p0); 61895 return __ret; 61896 } 61897 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_p8(poly8x8_t __p0) { 61898 mfloat8x8_t __ret; 61899 __ret = (mfloat8x8_t)(__p0); 61900 return __ret; 61901 } 61902 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_p64(poly64x1_t __p0) { 61903 mfloat8x8_t __ret; 61904 __ret = (mfloat8x8_t)(__p0); 61905 return __ret; 61906 } 61907 __ai __attribute__((target("neon"))) 
mfloat8x8_t vreinterpret_mf8_p16(poly16x4_t __p0) { 61908 mfloat8x8_t __ret; 61909 __ret = (mfloat8x8_t)(__p0); 61910 return __ret; 61911 } 61912 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_u8(uint8x8_t __p0) { 61913 mfloat8x8_t __ret; 61914 __ret = (mfloat8x8_t)(__p0); 61915 return __ret; 61916 } 61917 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_u32(uint32x2_t __p0) { 61918 mfloat8x8_t __ret; 61919 __ret = (mfloat8x8_t)(__p0); 61920 return __ret; 61921 } 61922 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_u64(uint64x1_t __p0) { 61923 mfloat8x8_t __ret; 61924 __ret = (mfloat8x8_t)(__p0); 61925 return __ret; 61926 } 61927 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_u16(uint16x4_t __p0) { 61928 mfloat8x8_t __ret; 61929 __ret = (mfloat8x8_t)(__p0); 61930 return __ret; 61931 } 61932 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_s8(int8x8_t __p0) { 61933 mfloat8x8_t __ret; 61934 __ret = (mfloat8x8_t)(__p0); 61935 return __ret; 61936 } 61937 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_f64(float64x1_t __p0) { 61938 mfloat8x8_t __ret; 61939 __ret = (mfloat8x8_t)(__p0); 61940 return __ret; 61941 } 61942 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_f32(float32x2_t __p0) { 61943 mfloat8x8_t __ret; 61944 __ret = (mfloat8x8_t)(__p0); 61945 return __ret; 61946 } 61947 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_f16(float16x4_t __p0) { 61948 mfloat8x8_t __ret; 61949 __ret = (mfloat8x8_t)(__p0); 61950 return __ret; 61951 } 61952 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_s32(int32x2_t __p0) { 61953 mfloat8x8_t __ret; 61954 __ret = (mfloat8x8_t)(__p0); 61955 return __ret; 61956 } 61957 __ai __attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_s64(int64x1_t __p0) { 61958 mfloat8x8_t __ret; 61959 __ret = (mfloat8x8_t)(__p0); 61960 return __ret; 61961 } 61962 __ai 
__attribute__((target("neon"))) mfloat8x8_t vreinterpret_mf8_s16(int16x4_t __p0) { 61963 mfloat8x8_t __ret; 61964 __ret = (mfloat8x8_t)(__p0); 61965 return __ret; 61966 } 61967 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p8(poly8x8_t __p0) { 61968 int16x4_t __ret; 61969 __ret = (int16x4_t)(__p0); 61970 return __ret; 61971 } 61972 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p64(poly64x1_t __p0) { 61973 int16x4_t __ret; 61974 __ret = (int16x4_t)(__p0); 61975 return __ret; 61976 } 61977 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_p16(poly16x4_t __p0) { 61978 int16x4_t __ret; 61979 __ret = (int16x4_t)(__p0); 61980 return __ret; 61981 } 61982 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u8(uint8x8_t __p0) { 61983 int16x4_t __ret; 61984 __ret = (int16x4_t)(__p0); 61985 return __ret; 61986 } 61987 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u32(uint32x2_t __p0) { 61988 int16x4_t __ret; 61989 __ret = (int16x4_t)(__p0); 61990 return __ret; 61991 } 61992 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u64(uint64x1_t __p0) { 61993 int16x4_t __ret; 61994 __ret = (int16x4_t)(__p0); 61995 return __ret; 61996 } 61997 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_u16(uint16x4_t __p0) { 61998 int16x4_t __ret; 61999 __ret = (int16x4_t)(__p0); 62000 return __ret; 62001 } 62002 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s8(int8x8_t __p0) { 62003 int16x4_t __ret; 62004 __ret = (int16x4_t)(__p0); 62005 return __ret; 62006 } 62007 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_f64(float64x1_t __p0) { 62008 int16x4_t __ret; 62009 __ret = (int16x4_t)(__p0); 62010 return __ret; 62011 } 62012 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_f32(float32x2_t __p0) { 62013 int16x4_t __ret; 62014 __ret = (int16x4_t)(__p0); 62015 return __ret; 62016 } 62017 __ai __attribute__((target("neon"))) int16x4_t 
vreinterpret_s16_f16(float16x4_t __p0) { 62018 int16x4_t __ret; 62019 __ret = (int16x4_t)(__p0); 62020 return __ret; 62021 } 62022 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s32(int32x2_t __p0) { 62023 int16x4_t __ret; 62024 __ret = (int16x4_t)(__p0); 62025 return __ret; 62026 } 62027 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_s64(int64x1_t __p0) { 62028 int16x4_t __ret; 62029 __ret = (int16x4_t)(__p0); 62030 return __ret; 62031 } 62032 __ai __attribute__((target("neon"))) int16x4_t vreinterpret_s16_mf8(mfloat8x8_t __p0) { 62033 int16x4_t __ret; 62034 __ret = (int16x4_t)(__p0); 62035 return __ret; 62036 } 62037 __ai __attribute__((target("neon"))) uint64_t vrshld_u64(uint64_t __p0, int64_t __p1) { 62038 uint64_t __ret; 62039 __ret = (uint64_t) __builtin_neon_vrshld_u64(__p0, __p1); 62040 return __ret; 62041 } 62042 __ai __attribute__((target("neon"))) int64_t vrshld_s64(int64_t __p0, int64_t __p1) { 62043 int64_t __ret; 62044 __ret = (int64_t) __builtin_neon_vrshld_s64(__p0, __p1); 62045 return __ret; 62046 } 62047 #define vrshrd_n_u64(__p0, __p1) __extension__ ({ \ 62048 uint64_t __ret; \ 62049 uint64_t __s0 = __p0; \ 62050 __ret = (uint64_t) __builtin_neon_vrshrd_n_u64(__s0, __p1); \ 62051 __ret; \ 62052 }) 62053 #define vrshrd_n_s64(__p0, __p1) __extension__ ({ \ 62054 int64_t __ret; \ 62055 int64_t __s0 = __p0; \ 62056 __ret = (int64_t) __builtin_neon_vrshrd_n_s64(__s0, __p1); \ 62057 __ret; \ 62058 }) 62059 #ifdef __LITTLE_ENDIAN__ 62060 #define vrshrn_high_n_u32(__p0_724, __p1_724, __p2_724) __extension__ ({ \ 62061 uint16x8_t __ret_724; \ 62062 uint16x4_t __s0_724 = __p0_724; \ 62063 uint32x4_t __s1_724 = __p1_724; \ 62064 __ret_724 = (uint16x8_t)(vcombine_u16((uint16x4_t)(__s0_724), (uint16x4_t)(vrshrn_n_u32(__s1_724, __p2_724)))); \ 62065 __ret_724; \ 62066 }) 62067 #else 62068 #define vrshrn_high_n_u32(__p0_725, __p1_725, __p2_725) __extension__ ({ \ 62069 uint16x8_t __ret_725; \ 62070 uint16x4_t __s0_725 = 
__p0_725; \ 62071 uint32x4_t __s1_725 = __p1_725; \ 62072 uint16x4_t __rev0_725; __rev0_725 = __builtin_shufflevector(__s0_725, __s0_725, 3, 2, 1, 0); \ 62073 uint32x4_t __rev1_725; __rev1_725 = __builtin_shufflevector(__s1_725, __s1_725, 3, 2, 1, 0); \ 62074 __ret_725 = (uint16x8_t)(__noswap_vcombine_u16((uint16x4_t)(__rev0_725), (uint16x4_t)(__noswap_vrshrn_n_u32(__rev1_725, __p2_725)))); \ 62075 __ret_725 = __builtin_shufflevector(__ret_725, __ret_725, 7, 6, 5, 4, 3, 2, 1, 0); \ 62076 __ret_725; \ 62077 }) 62078 #endif 62079 62080 #ifdef __LITTLE_ENDIAN__ 62081 #define vrshrn_high_n_u64(__p0_726, __p1_726, __p2_726) __extension__ ({ \ 62082 uint32x4_t __ret_726; \ 62083 uint32x2_t __s0_726 = __p0_726; \ 62084 uint64x2_t __s1_726 = __p1_726; \ 62085 __ret_726 = (uint32x4_t)(vcombine_u32((uint32x2_t)(__s0_726), (uint32x2_t)(vrshrn_n_u64(__s1_726, __p2_726)))); \ 62086 __ret_726; \ 62087 }) 62088 #else 62089 #define vrshrn_high_n_u64(__p0_727, __p1_727, __p2_727) __extension__ ({ \ 62090 uint32x4_t __ret_727; \ 62091 uint32x2_t __s0_727 = __p0_727; \ 62092 uint64x2_t __s1_727 = __p1_727; \ 62093 uint32x2_t __rev0_727; __rev0_727 = __builtin_shufflevector(__s0_727, __s0_727, 1, 0); \ 62094 uint64x2_t __rev1_727; __rev1_727 = __builtin_shufflevector(__s1_727, __s1_727, 1, 0); \ 62095 __ret_727 = (uint32x4_t)(__noswap_vcombine_u32((uint32x2_t)(__rev0_727), (uint32x2_t)(__noswap_vrshrn_n_u64(__rev1_727, __p2_727)))); \ 62096 __ret_727 = __builtin_shufflevector(__ret_727, __ret_727, 3, 2, 1, 0); \ 62097 __ret_727; \ 62098 }) 62099 #endif 62100 62101 #ifdef __LITTLE_ENDIAN__ 62102 #define vrshrn_high_n_u16(__p0_728, __p1_728, __p2_728) __extension__ ({ \ 62103 uint8x16_t __ret_728; \ 62104 uint8x8_t __s0_728 = __p0_728; \ 62105 uint16x8_t __s1_728 = __p1_728; \ 62106 __ret_728 = (uint8x16_t)(vcombine_u8((uint8x8_t)(__s0_728), (uint8x8_t)(vrshrn_n_u16(__s1_728, __p2_728)))); \ 62107 __ret_728; \ 62108 }) 62109 #else 62110 #define vrshrn_high_n_u16(__p0_729, __p1_729, 
__p2_729) __extension__ ({ \ 62111 uint8x16_t __ret_729; \ 62112 uint8x8_t __s0_729 = __p0_729; \ 62113 uint16x8_t __s1_729 = __p1_729; \ 62114 uint8x8_t __rev0_729; __rev0_729 = __builtin_shufflevector(__s0_729, __s0_729, 7, 6, 5, 4, 3, 2, 1, 0); \ 62115 uint16x8_t __rev1_729; __rev1_729 = __builtin_shufflevector(__s1_729, __s1_729, 7, 6, 5, 4, 3, 2, 1, 0); \ 62116 __ret_729 = (uint8x16_t)(__noswap_vcombine_u8((uint8x8_t)(__rev0_729), (uint8x8_t)(__noswap_vrshrn_n_u16(__rev1_729, __p2_729)))); \ 62117 __ret_729 = __builtin_shufflevector(__ret_729, __ret_729, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 62118 __ret_729; \ 62119 }) 62120 #endif 62121 62122 #ifdef __LITTLE_ENDIAN__ 62123 #define vrshrn_high_n_s32(__p0_730, __p1_730, __p2_730) __extension__ ({ \ 62124 int16x8_t __ret_730; \ 62125 int16x4_t __s0_730 = __p0_730; \ 62126 int32x4_t __s1_730 = __p1_730; \ 62127 __ret_730 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_730), (int16x4_t)(vrshrn_n_s32(__s1_730, __p2_730)))); \ 62128 __ret_730; \ 62129 }) 62130 #else 62131 #define vrshrn_high_n_s32(__p0_731, __p1_731, __p2_731) __extension__ ({ \ 62132 int16x8_t __ret_731; \ 62133 int16x4_t __s0_731 = __p0_731; \ 62134 int32x4_t __s1_731 = __p1_731; \ 62135 int16x4_t __rev0_731; __rev0_731 = __builtin_shufflevector(__s0_731, __s0_731, 3, 2, 1, 0); \ 62136 int32x4_t __rev1_731; __rev1_731 = __builtin_shufflevector(__s1_731, __s1_731, 3, 2, 1, 0); \ 62137 __ret_731 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_731), (int16x4_t)(__noswap_vrshrn_n_s32(__rev1_731, __p2_731)))); \ 62138 __ret_731 = __builtin_shufflevector(__ret_731, __ret_731, 7, 6, 5, 4, 3, 2, 1, 0); \ 62139 __ret_731; \ 62140 }) 62141 #endif 62142 62143 #ifdef __LITTLE_ENDIAN__ 62144 #define vrshrn_high_n_s64(__p0_732, __p1_732, __p2_732) __extension__ ({ \ 62145 int32x4_t __ret_732; \ 62146 int32x2_t __s0_732 = __p0_732; \ 62147 int64x2_t __s1_732 = __p1_732; \ 62148 __ret_732 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_732), 
(int32x2_t)(vrshrn_n_s64(__s1_732, __p2_732)))); \ 62149 __ret_732; \ 62150 }) 62151 #else 62152 #define vrshrn_high_n_s64(__p0_733, __p1_733, __p2_733) __extension__ ({ \ 62153 int32x4_t __ret_733; \ 62154 int32x2_t __s0_733 = __p0_733; \ 62155 int64x2_t __s1_733 = __p1_733; \ 62156 int32x2_t __rev0_733; __rev0_733 = __builtin_shufflevector(__s0_733, __s0_733, 1, 0); \ 62157 int64x2_t __rev1_733; __rev1_733 = __builtin_shufflevector(__s1_733, __s1_733, 1, 0); \ 62158 __ret_733 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_733), (int32x2_t)(__noswap_vrshrn_n_s64(__rev1_733, __p2_733)))); \ 62159 __ret_733 = __builtin_shufflevector(__ret_733, __ret_733, 3, 2, 1, 0); \ 62160 __ret_733; \ 62161 }) 62162 #endif 62163 62164 #ifdef __LITTLE_ENDIAN__ 62165 #define vrshrn_high_n_s16(__p0_734, __p1_734, __p2_734) __extension__ ({ \ 62166 int8x16_t __ret_734; \ 62167 int8x8_t __s0_734 = __p0_734; \ 62168 int16x8_t __s1_734 = __p1_734; \ 62169 __ret_734 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_734), (int8x8_t)(vrshrn_n_s16(__s1_734, __p2_734)))); \ 62170 __ret_734; \ 62171 }) 62172 #else 62173 #define vrshrn_high_n_s16(__p0_735, __p1_735, __p2_735) __extension__ ({ \ 62174 int8x16_t __ret_735; \ 62175 int8x8_t __s0_735 = __p0_735; \ 62176 int16x8_t __s1_735 = __p1_735; \ 62177 int8x8_t __rev0_735; __rev0_735 = __builtin_shufflevector(__s0_735, __s0_735, 7, 6, 5, 4, 3, 2, 1, 0); \ 62178 int16x8_t __rev1_735; __rev1_735 = __builtin_shufflevector(__s1_735, __s1_735, 7, 6, 5, 4, 3, 2, 1, 0); \ 62179 __ret_735 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_735), (int8x8_t)(__noswap_vrshrn_n_s16(__rev1_735, __p2_735)))); \ 62180 __ret_735 = __builtin_shufflevector(__ret_735, __ret_735, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 62181 __ret_735; \ 62182 }) 62183 #endif 62184 62185 #ifdef __LITTLE_ENDIAN__ 62186 __ai __attribute__((target("neon"))) float64x2_t vrsqrteq_f64(float64x2_t __p0) { 62187 float64x2_t __ret; 62188 __ret = (float64x2_t) 
__builtin_neon_vrsqrteq_v((int8x16_t)__p0, 42); 62189 return __ret; 62190 } 62191 #else 62192 __ai __attribute__((target("neon"))) float64x2_t vrsqrteq_f64(float64x2_t __p0) { 62193 float64x2_t __ret; 62194 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 62195 __ret = (float64x2_t) __builtin_neon_vrsqrteq_v((int8x16_t)__rev0, 42); 62196 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 62197 return __ret; 62198 } 62199 #endif 62200 62201 __ai __attribute__((target("neon"))) float64x1_t vrsqrte_f64(float64x1_t __p0) { 62202 float64x1_t __ret; 62203 __ret = (float64x1_t) __builtin_neon_vrsqrte_v((int8x8_t)__p0, 10); 62204 return __ret; 62205 } 62206 __ai __attribute__((target("neon"))) float64_t vrsqrted_f64(float64_t __p0) { 62207 float64_t __ret; 62208 __ret = (float64_t) __builtin_neon_vrsqrted_f64(__p0); 62209 return __ret; 62210 } 62211 __ai __attribute__((target("neon"))) float32_t vrsqrtes_f32(float32_t __p0) { 62212 float32_t __ret; 62213 __ret = (float32_t) __builtin_neon_vrsqrtes_f32(__p0); 62214 return __ret; 62215 } 62216 #ifdef __LITTLE_ENDIAN__ 62217 __ai __attribute__((target("neon"))) float64x2_t vrsqrtsq_f64(float64x2_t __p0, float64x2_t __p1) { 62218 float64x2_t __ret; 62219 __ret = (float64x2_t) __builtin_neon_vrsqrtsq_v((int8x16_t)__p0, (int8x16_t)__p1, 42); 62220 return __ret; 62221 } 62222 #else 62223 __ai __attribute__((target("neon"))) float64x2_t vrsqrtsq_f64(float64x2_t __p0, float64x2_t __p1) { 62224 float64x2_t __ret; 62225 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 62226 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 62227 __ret = (float64x2_t) __builtin_neon_vrsqrtsq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 62228 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 62229 return __ret; 62230 } 62231 #endif 62232 62233 __ai __attribute__((target("neon"))) float64x1_t vrsqrts_f64(float64x1_t __p0, float64x1_t __p1) { 62234 float64x1_t __ret; 62235 __ret = 
(float64x1_t) __builtin_neon_vrsqrts_v((int8x8_t)__p0, (int8x8_t)__p1, 10); 62236 return __ret; 62237 } 62238 __ai __attribute__((target("neon"))) float64_t vrsqrtsd_f64(float64_t __p0, float64_t __p1) { 62239 float64_t __ret; 62240 __ret = (float64_t) __builtin_neon_vrsqrtsd_f64(__p0, __p1); 62241 return __ret; 62242 } 62243 __ai __attribute__((target("neon"))) float32_t vrsqrtss_f32(float32_t __p0, float32_t __p1) { 62244 float32_t __ret; 62245 __ret = (float32_t) __builtin_neon_vrsqrtss_f32(__p0, __p1); 62246 return __ret; 62247 } 62248 #define vrsrad_n_u64(__p0, __p1, __p2) __extension__ ({ \ 62249 uint64_t __ret; \ 62250 uint64_t __s0 = __p0; \ 62251 uint64_t __s1 = __p1; \ 62252 __ret = (uint64_t) __builtin_neon_vrsrad_n_u64(__s0, __s1, __p2); \ 62253 __ret; \ 62254 }) 62255 #define vrsrad_n_s64(__p0, __p1, __p2) __extension__ ({ \ 62256 int64_t __ret; \ 62257 int64_t __s0 = __p0; \ 62258 int64_t __s1 = __p1; \ 62259 __ret = (int64_t) __builtin_neon_vrsrad_n_s64(__s0, __s1, __p2); \ 62260 __ret; \ 62261 }) 62262 #ifdef __LITTLE_ENDIAN__ 62263 __ai __attribute__((target("neon"))) uint16x8_t vrsubhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 62264 uint16x8_t __ret; 62265 __ret = vcombine_u16(__p0, vrsubhn_u32(__p1, __p2)); 62266 return __ret; 62267 } 62268 #else 62269 __ai __attribute__((target("neon"))) uint16x8_t vrsubhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 62270 uint16x8_t __ret; 62271 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 62272 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 62273 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 62274 __ret = __noswap_vcombine_u16(__rev0, __noswap_vrsubhn_u32(__rev1, __rev2)); 62275 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 62276 return __ret; 62277 } 62278 #endif 62279 62280 #ifdef __LITTLE_ENDIAN__ 62281 __ai __attribute__((target("neon"))) uint32x4_t 
vrsubhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 62282 uint32x4_t __ret; 62283 __ret = vcombine_u32(__p0, vrsubhn_u64(__p1, __p2)); 62284 return __ret; 62285 } 62286 #else 62287 __ai __attribute__((target("neon"))) uint32x4_t vrsubhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 62288 uint32x4_t __ret; 62289 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 62290 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 62291 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 62292 __ret = __noswap_vcombine_u32(__rev0, __noswap_vrsubhn_u64(__rev1, __rev2)); 62293 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 62294 return __ret; 62295 } 62296 #endif 62297 62298 #ifdef __LITTLE_ENDIAN__ 62299 __ai __attribute__((target("neon"))) uint8x16_t vrsubhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 62300 uint8x16_t __ret; 62301 __ret = vcombine_u8(__p0, vrsubhn_u16(__p1, __p2)); 62302 return __ret; 62303 } 62304 #else 62305 __ai __attribute__((target("neon"))) uint8x16_t vrsubhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 62306 uint8x16_t __ret; 62307 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 62308 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 62309 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 62310 __ret = __noswap_vcombine_u8(__rev0, __noswap_vrsubhn_u16(__rev1, __rev2)); 62311 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 62312 return __ret; 62313 } 62314 #endif 62315 62316 #ifdef __LITTLE_ENDIAN__ 62317 __ai __attribute__((target("neon"))) int16x8_t vrsubhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 62318 int16x8_t __ret; 62319 __ret = vcombine_s16(__p0, vrsubhn_s32(__p1, __p2)); 62320 return __ret; 62321 } 62322 #else 62323 __ai 
__attribute__((target("neon"))) int16x8_t vrsubhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 62324 int16x8_t __ret; 62325 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 62326 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 62327 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 62328 __ret = __noswap_vcombine_s16(__rev0, __noswap_vrsubhn_s32(__rev1, __rev2)); 62329 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 62330 return __ret; 62331 } 62332 #endif 62333 62334 #ifdef __LITTLE_ENDIAN__ 62335 __ai __attribute__((target("neon"))) int32x4_t vrsubhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 62336 int32x4_t __ret; 62337 __ret = vcombine_s32(__p0, vrsubhn_s64(__p1, __p2)); 62338 return __ret; 62339 } 62340 #else 62341 __ai __attribute__((target("neon"))) int32x4_t vrsubhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 62342 int32x4_t __ret; 62343 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 62344 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 62345 int64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 62346 __ret = __noswap_vcombine_s32(__rev0, __noswap_vrsubhn_s64(__rev1, __rev2)); 62347 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 62348 return __ret; 62349 } 62350 #endif 62351 62352 #ifdef __LITTLE_ENDIAN__ 62353 __ai __attribute__((target("neon"))) int8x16_t vrsubhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 62354 int8x16_t __ret; 62355 __ret = vcombine_s8(__p0, vrsubhn_s16(__p1, __p2)); 62356 return __ret; 62357 } 62358 #else 62359 __ai __attribute__((target("neon"))) int8x16_t vrsubhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 62360 int8x16_t __ret; 62361 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 62362 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 
7, 6, 5, 4, 3, 2, 1, 0); 62363 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 62364 __ret = __noswap_vcombine_s8(__rev0, __noswap_vrsubhn_s16(__rev1, __rev2)); 62365 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 62366 return __ret; 62367 } 62368 #endif 62369 62370 #define vset_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 62371 poly64x1_t __ret; \ 62372 poly64_t __s0 = __p0; \ 62373 poly64x1_t __s1 = __p1; \ 62374 __ret = (poly64x1_t) __builtin_neon_vset_lane_i64(__s0, (poly64x1_t)__s1, __p2); \ 62375 __ret; \ 62376 }) 62377 #ifdef __LITTLE_ENDIAN__ 62378 #define vsetq_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 62379 poly64x2_t __ret; \ 62380 poly64_t __s0 = __p0; \ 62381 poly64x2_t __s1 = __p1; \ 62382 __ret = (poly64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (poly64x2_t)__s1, __p2); \ 62383 __ret; \ 62384 }) 62385 #else 62386 #define vsetq_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 62387 poly64x2_t __ret; \ 62388 poly64_t __s0 = __p0; \ 62389 poly64x2_t __s1 = __p1; \ 62390 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 62391 __ret = (poly64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (poly64x2_t)__rev1, __p2); \ 62392 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 62393 __ret; \ 62394 }) 62395 #define __noswap_vsetq_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 62396 poly64x2_t __ret; \ 62397 poly64_t __s0 = __p0; \ 62398 poly64x2_t __s1 = __p1; \ 62399 __ret = (poly64x2_t) __builtin_neon_vsetq_lane_i64(__s0, (poly64x2_t)__s1, __p2); \ 62400 __ret; \ 62401 }) 62402 #endif 62403 62404 #ifdef __LITTLE_ENDIAN__ 62405 #define vsetq_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 62406 float64x2_t __ret; \ 62407 float64_t __s0 = __p0; \ 62408 float64x2_t __s1 = __p1; \ 62409 __ret = (float64x2_t) __builtin_neon_vsetq_lane_f64(__s0, (float64x2_t)__s1, __p2); \ 62410 __ret; \ 62411 }) 62412 #else 62413 #define vsetq_lane_f64(__p0, __p1, 
__p2) __extension__ ({ \ 62414 float64x2_t __ret; \ 62415 float64_t __s0 = __p0; \ 62416 float64x2_t __s1 = __p1; \ 62417 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 62418 __ret = (float64x2_t) __builtin_neon_vsetq_lane_f64(__s0, (float64x2_t)__rev1, __p2); \ 62419 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 62420 __ret; \ 62421 }) 62422 #define __noswap_vsetq_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 62423 float64x2_t __ret; \ 62424 float64_t __s0 = __p0; \ 62425 float64x2_t __s1 = __p1; \ 62426 __ret = (float64x2_t) __builtin_neon_vsetq_lane_f64(__s0, (float64x2_t)__s1, __p2); \ 62427 __ret; \ 62428 }) 62429 #endif 62430 62431 #define vset_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 62432 float64x1_t __ret; \ 62433 float64_t __s0 = __p0; \ 62434 float64x1_t __s1 = __p1; \ 62435 __ret = (float64x1_t) __builtin_neon_vset_lane_f64(__s0, (float64x1_t)__s1, __p2); \ 62436 __ret; \ 62437 }) 62438 __ai __attribute__((target("neon"))) uint64_t vshld_u64(uint64_t __p0, int64_t __p1) { 62439 uint64_t __ret; 62440 __ret = (uint64_t) __builtin_neon_vshld_u64(__p0, __p1); 62441 return __ret; 62442 } 62443 __ai __attribute__((target("neon"))) int64_t vshld_s64(int64_t __p0, int64_t __p1) { 62444 int64_t __ret; 62445 __ret = (int64_t) __builtin_neon_vshld_s64(__p0, __p1); 62446 return __ret; 62447 } 62448 #define vshld_n_u64(__p0, __p1) __extension__ ({ \ 62449 uint64_t __ret; \ 62450 uint64_t __s0 = __p0; \ 62451 __ret = (uint64_t) __builtin_neon_vshld_n_u64(__s0, __p1); \ 62452 __ret; \ 62453 }) 62454 #define vshld_n_s64(__p0, __p1) __extension__ ({ \ 62455 int64_t __ret; \ 62456 int64_t __s0 = __p0; \ 62457 __ret = (int64_t) __builtin_neon_vshld_n_s64(__s0, __p1); \ 62458 __ret; \ 62459 }) 62460 #ifdef __LITTLE_ENDIAN__ 62461 #define vshll_high_n_u8(__p0_736, __p1_736) __extension__ ({ \ 62462 uint16x8_t __ret_736; \ 62463 uint8x16_t __s0_736 = __p0_736; \ 62464 __ret_736 = (uint16x8_t)(vshll_n_u8(vget_high_u8(__s0_736), 
__p1_736)); \ 62465 __ret_736; \ 62466 }) 62467 #else 62468 #define vshll_high_n_u8(__p0_737, __p1_737) __extension__ ({ \ 62469 uint16x8_t __ret_737; \ 62470 uint8x16_t __s0_737 = __p0_737; \ 62471 uint8x16_t __rev0_737; __rev0_737 = __builtin_shufflevector(__s0_737, __s0_737, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 62472 __ret_737 = (uint16x8_t)(__noswap_vshll_n_u8(__noswap_vget_high_u8(__rev0_737), __p1_737)); \ 62473 __ret_737 = __builtin_shufflevector(__ret_737, __ret_737, 7, 6, 5, 4, 3, 2, 1, 0); \ 62474 __ret_737; \ 62475 }) 62476 #endif 62477 62478 #ifdef __LITTLE_ENDIAN__ 62479 #define vshll_high_n_u32(__p0_738, __p1_738) __extension__ ({ \ 62480 uint64x2_t __ret_738; \ 62481 uint32x4_t __s0_738 = __p0_738; \ 62482 __ret_738 = (uint64x2_t)(vshll_n_u32(vget_high_u32(__s0_738), __p1_738)); \ 62483 __ret_738; \ 62484 }) 62485 #else 62486 #define vshll_high_n_u32(__p0_739, __p1_739) __extension__ ({ \ 62487 uint64x2_t __ret_739; \ 62488 uint32x4_t __s0_739 = __p0_739; \ 62489 uint32x4_t __rev0_739; __rev0_739 = __builtin_shufflevector(__s0_739, __s0_739, 3, 2, 1, 0); \ 62490 __ret_739 = (uint64x2_t)(__noswap_vshll_n_u32(__noswap_vget_high_u32(__rev0_739), __p1_739)); \ 62491 __ret_739 = __builtin_shufflevector(__ret_739, __ret_739, 1, 0); \ 62492 __ret_739; \ 62493 }) 62494 #endif 62495 62496 #ifdef __LITTLE_ENDIAN__ 62497 #define vshll_high_n_u16(__p0_740, __p1_740) __extension__ ({ \ 62498 uint32x4_t __ret_740; \ 62499 uint16x8_t __s0_740 = __p0_740; \ 62500 __ret_740 = (uint32x4_t)(vshll_n_u16(vget_high_u16(__s0_740), __p1_740)); \ 62501 __ret_740; \ 62502 }) 62503 #else 62504 #define vshll_high_n_u16(__p0_741, __p1_741) __extension__ ({ \ 62505 uint32x4_t __ret_741; \ 62506 uint16x8_t __s0_741 = __p0_741; \ 62507 uint16x8_t __rev0_741; __rev0_741 = __builtin_shufflevector(__s0_741, __s0_741, 7, 6, 5, 4, 3, 2, 1, 0); \ 62508 __ret_741 = (uint32x4_t)(__noswap_vshll_n_u16(__noswap_vget_high_u16(__rev0_741), __p1_741)); \ 62509 __ret_741 = 
__builtin_shufflevector(__ret_741, __ret_741, 3, 2, 1, 0); \ 62510 __ret_741; \ 62511 }) 62512 #endif 62513 62514 #ifdef __LITTLE_ENDIAN__ 62515 #define vshll_high_n_s8(__p0_742, __p1_742) __extension__ ({ \ 62516 int16x8_t __ret_742; \ 62517 int8x16_t __s0_742 = __p0_742; \ 62518 __ret_742 = (int16x8_t)(vshll_n_s8(vget_high_s8(__s0_742), __p1_742)); \ 62519 __ret_742; \ 62520 }) 62521 #else 62522 #define vshll_high_n_s8(__p0_743, __p1_743) __extension__ ({ \ 62523 int16x8_t __ret_743; \ 62524 int8x16_t __s0_743 = __p0_743; \ 62525 int8x16_t __rev0_743; __rev0_743 = __builtin_shufflevector(__s0_743, __s0_743, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 62526 __ret_743 = (int16x8_t)(__noswap_vshll_n_s8(__noswap_vget_high_s8(__rev0_743), __p1_743)); \ 62527 __ret_743 = __builtin_shufflevector(__ret_743, __ret_743, 7, 6, 5, 4, 3, 2, 1, 0); \ 62528 __ret_743; \ 62529 }) 62530 #endif 62531 62532 #ifdef __LITTLE_ENDIAN__ 62533 #define vshll_high_n_s32(__p0_744, __p1_744) __extension__ ({ \ 62534 int64x2_t __ret_744; \ 62535 int32x4_t __s0_744 = __p0_744; \ 62536 __ret_744 = (int64x2_t)(vshll_n_s32(vget_high_s32(__s0_744), __p1_744)); \ 62537 __ret_744; \ 62538 }) 62539 #else 62540 #define vshll_high_n_s32(__p0_745, __p1_745) __extension__ ({ \ 62541 int64x2_t __ret_745; \ 62542 int32x4_t __s0_745 = __p0_745; \ 62543 int32x4_t __rev0_745; __rev0_745 = __builtin_shufflevector(__s0_745, __s0_745, 3, 2, 1, 0); \ 62544 __ret_745 = (int64x2_t)(__noswap_vshll_n_s32(__noswap_vget_high_s32(__rev0_745), __p1_745)); \ 62545 __ret_745 = __builtin_shufflevector(__ret_745, __ret_745, 1, 0); \ 62546 __ret_745; \ 62547 }) 62548 #endif 62549 62550 #ifdef __LITTLE_ENDIAN__ 62551 #define vshll_high_n_s16(__p0_746, __p1_746) __extension__ ({ \ 62552 int32x4_t __ret_746; \ 62553 int16x8_t __s0_746 = __p0_746; \ 62554 __ret_746 = (int32x4_t)(vshll_n_s16(vget_high_s16(__s0_746), __p1_746)); \ 62555 __ret_746; \ 62556 }) 62557 #else 62558 #define vshll_high_n_s16(__p0_747, 
__p1_747) __extension__ ({ \ 62559 int32x4_t __ret_747; \ 62560 int16x8_t __s0_747 = __p0_747; \ 62561 int16x8_t __rev0_747; __rev0_747 = __builtin_shufflevector(__s0_747, __s0_747, 7, 6, 5, 4, 3, 2, 1, 0); \ 62562 __ret_747 = (int32x4_t)(__noswap_vshll_n_s16(__noswap_vget_high_s16(__rev0_747), __p1_747)); \ 62563 __ret_747 = __builtin_shufflevector(__ret_747, __ret_747, 3, 2, 1, 0); \ 62564 __ret_747; \ 62565 }) 62566 #endif 62567 62568 #define vshrd_n_u64(__p0, __p1) __extension__ ({ \ 62569 uint64_t __ret; \ 62570 uint64_t __s0 = __p0; \ 62571 __ret = (uint64_t) __builtin_neon_vshrd_n_u64(__s0, __p1); \ 62572 __ret; \ 62573 }) 62574 #define vshrd_n_s64(__p0, __p1) __extension__ ({ \ 62575 int64_t __ret; \ 62576 int64_t __s0 = __p0; \ 62577 __ret = (int64_t) __builtin_neon_vshrd_n_s64(__s0, __p1); \ 62578 __ret; \ 62579 }) 62580 #ifdef __LITTLE_ENDIAN__ 62581 #define vshrn_high_n_u32(__p0_748, __p1_748, __p2_748) __extension__ ({ \ 62582 uint16x8_t __ret_748; \ 62583 uint16x4_t __s0_748 = __p0_748; \ 62584 uint32x4_t __s1_748 = __p1_748; \ 62585 __ret_748 = (uint16x8_t)(vcombine_u16((uint16x4_t)(__s0_748), (uint16x4_t)(vshrn_n_u32(__s1_748, __p2_748)))); \ 62586 __ret_748; \ 62587 }) 62588 #else 62589 #define vshrn_high_n_u32(__p0_749, __p1_749, __p2_749) __extension__ ({ \ 62590 uint16x8_t __ret_749; \ 62591 uint16x4_t __s0_749 = __p0_749; \ 62592 uint32x4_t __s1_749 = __p1_749; \ 62593 uint16x4_t __rev0_749; __rev0_749 = __builtin_shufflevector(__s0_749, __s0_749, 3, 2, 1, 0); \ 62594 uint32x4_t __rev1_749; __rev1_749 = __builtin_shufflevector(__s1_749, __s1_749, 3, 2, 1, 0); \ 62595 __ret_749 = (uint16x8_t)(__noswap_vcombine_u16((uint16x4_t)(__rev0_749), (uint16x4_t)(__noswap_vshrn_n_u32(__rev1_749, __p2_749)))); \ 62596 __ret_749 = __builtin_shufflevector(__ret_749, __ret_749, 7, 6, 5, 4, 3, 2, 1, 0); \ 62597 __ret_749; \ 62598 }) 62599 #endif 62600 62601 #ifdef __LITTLE_ENDIAN__ 62602 #define vshrn_high_n_u64(__p0_750, __p1_750, __p2_750) __extension__ ({ \ 
62603 uint32x4_t __ret_750; \ 62604 uint32x2_t __s0_750 = __p0_750; \ 62605 uint64x2_t __s1_750 = __p1_750; \ 62606 __ret_750 = (uint32x4_t)(vcombine_u32((uint32x2_t)(__s0_750), (uint32x2_t)(vshrn_n_u64(__s1_750, __p2_750)))); \ 62607 __ret_750; \ 62608 }) 62609 #else 62610 #define vshrn_high_n_u64(__p0_751, __p1_751, __p2_751) __extension__ ({ \ 62611 uint32x4_t __ret_751; \ 62612 uint32x2_t __s0_751 = __p0_751; \ 62613 uint64x2_t __s1_751 = __p1_751; \ 62614 uint32x2_t __rev0_751; __rev0_751 = __builtin_shufflevector(__s0_751, __s0_751, 1, 0); \ 62615 uint64x2_t __rev1_751; __rev1_751 = __builtin_shufflevector(__s1_751, __s1_751, 1, 0); \ 62616 __ret_751 = (uint32x4_t)(__noswap_vcombine_u32((uint32x2_t)(__rev0_751), (uint32x2_t)(__noswap_vshrn_n_u64(__rev1_751, __p2_751)))); \ 62617 __ret_751 = __builtin_shufflevector(__ret_751, __ret_751, 3, 2, 1, 0); \ 62618 __ret_751; \ 62619 }) 62620 #endif 62621 62622 #ifdef __LITTLE_ENDIAN__ 62623 #define vshrn_high_n_u16(__p0_752, __p1_752, __p2_752) __extension__ ({ \ 62624 uint8x16_t __ret_752; \ 62625 uint8x8_t __s0_752 = __p0_752; \ 62626 uint16x8_t __s1_752 = __p1_752; \ 62627 __ret_752 = (uint8x16_t)(vcombine_u8((uint8x8_t)(__s0_752), (uint8x8_t)(vshrn_n_u16(__s1_752, __p2_752)))); \ 62628 __ret_752; \ 62629 }) 62630 #else 62631 #define vshrn_high_n_u16(__p0_753, __p1_753, __p2_753) __extension__ ({ \ 62632 uint8x16_t __ret_753; \ 62633 uint8x8_t __s0_753 = __p0_753; \ 62634 uint16x8_t __s1_753 = __p1_753; \ 62635 uint8x8_t __rev0_753; __rev0_753 = __builtin_shufflevector(__s0_753, __s0_753, 7, 6, 5, 4, 3, 2, 1, 0); \ 62636 uint16x8_t __rev1_753; __rev1_753 = __builtin_shufflevector(__s1_753, __s1_753, 7, 6, 5, 4, 3, 2, 1, 0); \ 62637 __ret_753 = (uint8x16_t)(__noswap_vcombine_u8((uint8x8_t)(__rev0_753), (uint8x8_t)(__noswap_vshrn_n_u16(__rev1_753, __p2_753)))); \ 62638 __ret_753 = __builtin_shufflevector(__ret_753, __ret_753, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 62639 __ret_753; \ 62640 }) 62641 
#endif 62642 62643 #ifdef __LITTLE_ENDIAN__ 62644 #define vshrn_high_n_s32(__p0_754, __p1_754, __p2_754) __extension__ ({ \ 62645 int16x8_t __ret_754; \ 62646 int16x4_t __s0_754 = __p0_754; \ 62647 int32x4_t __s1_754 = __p1_754; \ 62648 __ret_754 = (int16x8_t)(vcombine_s16((int16x4_t)(__s0_754), (int16x4_t)(vshrn_n_s32(__s1_754, __p2_754)))); \ 62649 __ret_754; \ 62650 }) 62651 #else 62652 #define vshrn_high_n_s32(__p0_755, __p1_755, __p2_755) __extension__ ({ \ 62653 int16x8_t __ret_755; \ 62654 int16x4_t __s0_755 = __p0_755; \ 62655 int32x4_t __s1_755 = __p1_755; \ 62656 int16x4_t __rev0_755; __rev0_755 = __builtin_shufflevector(__s0_755, __s0_755, 3, 2, 1, 0); \ 62657 int32x4_t __rev1_755; __rev1_755 = __builtin_shufflevector(__s1_755, __s1_755, 3, 2, 1, 0); \ 62658 __ret_755 = (int16x8_t)(__noswap_vcombine_s16((int16x4_t)(__rev0_755), (int16x4_t)(__noswap_vshrn_n_s32(__rev1_755, __p2_755)))); \ 62659 __ret_755 = __builtin_shufflevector(__ret_755, __ret_755, 7, 6, 5, 4, 3, 2, 1, 0); \ 62660 __ret_755; \ 62661 }) 62662 #endif 62663 62664 #ifdef __LITTLE_ENDIAN__ 62665 #define vshrn_high_n_s64(__p0_756, __p1_756, __p2_756) __extension__ ({ \ 62666 int32x4_t __ret_756; \ 62667 int32x2_t __s0_756 = __p0_756; \ 62668 int64x2_t __s1_756 = __p1_756; \ 62669 __ret_756 = (int32x4_t)(vcombine_s32((int32x2_t)(__s0_756), (int32x2_t)(vshrn_n_s64(__s1_756, __p2_756)))); \ 62670 __ret_756; \ 62671 }) 62672 #else 62673 #define vshrn_high_n_s64(__p0_757, __p1_757, __p2_757) __extension__ ({ \ 62674 int32x4_t __ret_757; \ 62675 int32x2_t __s0_757 = __p0_757; \ 62676 int64x2_t __s1_757 = __p1_757; \ 62677 int32x2_t __rev0_757; __rev0_757 = __builtin_shufflevector(__s0_757, __s0_757, 1, 0); \ 62678 int64x2_t __rev1_757; __rev1_757 = __builtin_shufflevector(__s1_757, __s1_757, 1, 0); \ 62679 __ret_757 = (int32x4_t)(__noswap_vcombine_s32((int32x2_t)(__rev0_757), (int32x2_t)(__noswap_vshrn_n_s64(__rev1_757, __p2_757)))); \ 62680 __ret_757 = __builtin_shufflevector(__ret_757, 
__ret_757, 3, 2, 1, 0); \ 62681 __ret_757; \ 62682 }) 62683 #endif 62684 62685 #ifdef __LITTLE_ENDIAN__ 62686 #define vshrn_high_n_s16(__p0_758, __p1_758, __p2_758) __extension__ ({ \ 62687 int8x16_t __ret_758; \ 62688 int8x8_t __s0_758 = __p0_758; \ 62689 int16x8_t __s1_758 = __p1_758; \ 62690 __ret_758 = (int8x16_t)(vcombine_s8((int8x8_t)(__s0_758), (int8x8_t)(vshrn_n_s16(__s1_758, __p2_758)))); \ 62691 __ret_758; \ 62692 }) 62693 #else 62694 #define vshrn_high_n_s16(__p0_759, __p1_759, __p2_759) __extension__ ({ \ 62695 int8x16_t __ret_759; \ 62696 int8x8_t __s0_759 = __p0_759; \ 62697 int16x8_t __s1_759 = __p1_759; \ 62698 int8x8_t __rev0_759; __rev0_759 = __builtin_shufflevector(__s0_759, __s0_759, 7, 6, 5, 4, 3, 2, 1, 0); \ 62699 int16x8_t __rev1_759; __rev1_759 = __builtin_shufflevector(__s1_759, __s1_759, 7, 6, 5, 4, 3, 2, 1, 0); \ 62700 __ret_759 = (int8x16_t)(__noswap_vcombine_s8((int8x8_t)(__rev0_759), (int8x8_t)(__noswap_vshrn_n_s16(__rev1_759, __p2_759)))); \ 62701 __ret_759 = __builtin_shufflevector(__ret_759, __ret_759, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 62702 __ret_759; \ 62703 }) 62704 #endif 62705 62706 #define vslid_n_u64(__p0, __p1, __p2) __extension__ ({ \ 62707 uint64_t __ret; \ 62708 uint64_t __s0 = __p0; \ 62709 uint64_t __s1 = __p1; \ 62710 __ret = (uint64_t) __builtin_neon_vslid_n_u64(__s0, __s1, __p2); \ 62711 __ret; \ 62712 }) 62713 #define vslid_n_s64(__p0, __p1, __p2) __extension__ ({ \ 62714 int64_t __ret; \ 62715 int64_t __s0 = __p0; \ 62716 int64_t __s1 = __p1; \ 62717 __ret = (int64_t) __builtin_neon_vslid_n_s64(__s0, __s1, __p2); \ 62718 __ret; \ 62719 }) 62720 #define vsli_n_p64(__p0, __p1, __p2) __extension__ ({ \ 62721 poly64x1_t __ret; \ 62722 poly64x1_t __s0 = __p0; \ 62723 poly64x1_t __s1 = __p1; \ 62724 __ret = (poly64x1_t) __builtin_neon_vsli_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 6); \ 62725 __ret; \ 62726 }) 62727 #ifdef __LITTLE_ENDIAN__ 62728 #define vsliq_n_p64(__p0, __p1, __p2) __extension__ 
({ \ 62729 poly64x2_t __ret; \ 62730 poly64x2_t __s0 = __p0; \ 62731 poly64x2_t __s1 = __p1; \ 62732 __ret = (poly64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 38); \ 62733 __ret; \ 62734 }) 62735 #else 62736 #define vsliq_n_p64(__p0, __p1, __p2) __extension__ ({ \ 62737 poly64x2_t __ret; \ 62738 poly64x2_t __s0 = __p0; \ 62739 poly64x2_t __s1 = __p1; \ 62740 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 62741 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 62742 __ret = (poly64x2_t) __builtin_neon_vsliq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 38); \ 62743 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 62744 __ret; \ 62745 }) 62746 #endif 62747 62748 __ai __attribute__((target("neon"))) uint8_t vsqaddb_u8(uint8_t __p0, int8_t __p1) { 62749 uint8_t __ret; 62750 __ret = (uint8_t) __builtin_neon_vsqaddb_u8(__p0, __p1); 62751 return __ret; 62752 } 62753 __ai __attribute__((target("neon"))) uint32_t vsqadds_u32(uint32_t __p0, int32_t __p1) { 62754 uint32_t __ret; 62755 __ret = (uint32_t) __builtin_neon_vsqadds_u32(__p0, __p1); 62756 return __ret; 62757 } 62758 __ai __attribute__((target("neon"))) uint64_t vsqaddd_u64(uint64_t __p0, int64_t __p1) { 62759 uint64_t __ret; 62760 __ret = (uint64_t) __builtin_neon_vsqaddd_u64(__p0, __p1); 62761 return __ret; 62762 } 62763 __ai __attribute__((target("neon"))) uint16_t vsqaddh_u16(uint16_t __p0, int16_t __p1) { 62764 uint16_t __ret; 62765 __ret = (uint16_t) __builtin_neon_vsqaddh_u16(__p0, __p1); 62766 return __ret; 62767 } 62768 #ifdef __LITTLE_ENDIAN__ 62769 __ai __attribute__((target("neon"))) uint8x16_t vsqaddq_u8(uint8x16_t __p0, int8x16_t __p1) { 62770 uint8x16_t __ret; 62771 __ret = (uint8x16_t) __builtin_neon_vsqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 48); 62772 return __ret; 62773 } 62774 #else 62775 __ai __attribute__((target("neon"))) uint8x16_t vsqaddq_u8(uint8x16_t __p0, int8x16_t __p1) { 62776 uint8x16_t __ret; 62777 
uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 62778 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 62779 __ret = (uint8x16_t) __builtin_neon_vsqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 48); 62780 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 62781 return __ret; 62782 } 62783 #endif 62784 62785 #ifdef __LITTLE_ENDIAN__ 62786 __ai __attribute__((target("neon"))) uint32x4_t vsqaddq_u32(uint32x4_t __p0, int32x4_t __p1) { 62787 uint32x4_t __ret; 62788 __ret = (uint32x4_t) __builtin_neon_vsqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 50); 62789 return __ret; 62790 } 62791 #else 62792 __ai __attribute__((target("neon"))) uint32x4_t vsqaddq_u32(uint32x4_t __p0, int32x4_t __p1) { 62793 uint32x4_t __ret; 62794 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 62795 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 62796 __ret = (uint32x4_t) __builtin_neon_vsqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 62797 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 62798 return __ret; 62799 } 62800 #endif 62801 62802 #ifdef __LITTLE_ENDIAN__ 62803 __ai __attribute__((target("neon"))) uint64x2_t vsqaddq_u64(uint64x2_t __p0, int64x2_t __p1) { 62804 uint64x2_t __ret; 62805 __ret = (uint64x2_t) __builtin_neon_vsqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 62806 return __ret; 62807 } 62808 #else 62809 __ai __attribute__((target("neon"))) uint64x2_t vsqaddq_u64(uint64x2_t __p0, int64x2_t __p1) { 62810 uint64x2_t __ret; 62811 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 62812 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 62813 __ret = (uint64x2_t) __builtin_neon_vsqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 62814 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 
62815 return __ret; 62816 } 62817 #endif 62818 62819 #ifdef __LITTLE_ENDIAN__ 62820 __ai __attribute__((target("neon"))) uint16x8_t vsqaddq_u16(uint16x8_t __p0, int16x8_t __p1) { 62821 uint16x8_t __ret; 62822 __ret = (uint16x8_t) __builtin_neon_vsqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 49); 62823 return __ret; 62824 } 62825 #else 62826 __ai __attribute__((target("neon"))) uint16x8_t vsqaddq_u16(uint16x8_t __p0, int16x8_t __p1) { 62827 uint16x8_t __ret; 62828 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 62829 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 62830 __ret = (uint16x8_t) __builtin_neon_vsqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 49); 62831 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 62832 return __ret; 62833 } 62834 #endif 62835 62836 #ifdef __LITTLE_ENDIAN__ 62837 __ai __attribute__((target("neon"))) uint8x8_t vsqadd_u8(uint8x8_t __p0, int8x8_t __p1) { 62838 uint8x8_t __ret; 62839 __ret = (uint8x8_t) __builtin_neon_vsqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 16); 62840 return __ret; 62841 } 62842 #else 62843 __ai __attribute__((target("neon"))) uint8x8_t vsqadd_u8(uint8x8_t __p0, int8x8_t __p1) { 62844 uint8x8_t __ret; 62845 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 62846 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 62847 __ret = (uint8x8_t) __builtin_neon_vsqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 16); 62848 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 62849 return __ret; 62850 } 62851 #endif 62852 62853 #ifdef __LITTLE_ENDIAN__ 62854 __ai __attribute__((target("neon"))) uint32x2_t vsqadd_u32(uint32x2_t __p0, int32x2_t __p1) { 62855 uint32x2_t __ret; 62856 __ret = (uint32x2_t) __builtin_neon_vsqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 18); 62857 return __ret; 62858 } 62859 #else 62860 __ai __attribute__((target("neon"))) 
uint32x2_t vsqadd_u32(uint32x2_t __p0, int32x2_t __p1) { 62861 uint32x2_t __ret; 62862 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 62863 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 62864 __ret = (uint32x2_t) __builtin_neon_vsqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 18); 62865 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 62866 return __ret; 62867 } 62868 #endif 62869 62870 __ai __attribute__((target("neon"))) uint64x1_t vsqadd_u64(uint64x1_t __p0, int64x1_t __p1) { 62871 uint64x1_t __ret; 62872 __ret = (uint64x1_t) __builtin_neon_vsqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 62873 return __ret; 62874 } 62875 #ifdef __LITTLE_ENDIAN__ 62876 __ai __attribute__((target("neon"))) uint16x4_t vsqadd_u16(uint16x4_t __p0, int16x4_t __p1) { 62877 uint16x4_t __ret; 62878 __ret = (uint16x4_t) __builtin_neon_vsqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 17); 62879 return __ret; 62880 } 62881 #else 62882 __ai __attribute__((target("neon"))) uint16x4_t vsqadd_u16(uint16x4_t __p0, int16x4_t __p1) { 62883 uint16x4_t __ret; 62884 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 62885 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 62886 __ret = (uint16x4_t) __builtin_neon_vsqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 17); 62887 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 62888 return __ret; 62889 } 62890 #endif 62891 62892 #ifdef __LITTLE_ENDIAN__ 62893 __ai __attribute__((target("neon"))) float64x2_t vsqrtq_f64(float64x2_t __p0) { 62894 float64x2_t __ret; 62895 __ret = (float64x2_t) __builtin_neon_vsqrtq_v((int8x16_t)__p0, 42); 62896 return __ret; 62897 } 62898 #else 62899 __ai __attribute__((target("neon"))) float64x2_t vsqrtq_f64(float64x2_t __p0) { 62900 float64x2_t __ret; 62901 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 62902 __ret = (float64x2_t) __builtin_neon_vsqrtq_v((int8x16_t)__rev0, 42); 62903 __ret = 
__builtin_shufflevector(__ret, __ret, 1, 0); 62904 return __ret; 62905 } 62906 #endif 62907 62908 #ifdef __LITTLE_ENDIAN__ 62909 __ai __attribute__((target("neon"))) float32x4_t vsqrtq_f32(float32x4_t __p0) { 62910 float32x4_t __ret; 62911 __ret = (float32x4_t) __builtin_neon_vsqrtq_v((int8x16_t)__p0, 41); 62912 return __ret; 62913 } 62914 #else 62915 __ai __attribute__((target("neon"))) float32x4_t vsqrtq_f32(float32x4_t __p0) { 62916 float32x4_t __ret; 62917 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 62918 __ret = (float32x4_t) __builtin_neon_vsqrtq_v((int8x16_t)__rev0, 41); 62919 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 62920 return __ret; 62921 } 62922 #endif 62923 62924 __ai __attribute__((target("neon"))) float64x1_t vsqrt_f64(float64x1_t __p0) { 62925 float64x1_t __ret; 62926 __ret = (float64x1_t) __builtin_neon_vsqrt_v((int8x8_t)__p0, 10); 62927 return __ret; 62928 } 62929 #ifdef __LITTLE_ENDIAN__ 62930 __ai __attribute__((target("neon"))) float32x2_t vsqrt_f32(float32x2_t __p0) { 62931 float32x2_t __ret; 62932 __ret = (float32x2_t) __builtin_neon_vsqrt_v((int8x8_t)__p0, 9); 62933 return __ret; 62934 } 62935 #else 62936 __ai __attribute__((target("neon"))) float32x2_t vsqrt_f32(float32x2_t __p0) { 62937 float32x2_t __ret; 62938 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 62939 __ret = (float32x2_t) __builtin_neon_vsqrt_v((int8x8_t)__rev0, 9); 62940 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 62941 return __ret; 62942 } 62943 #endif 62944 62945 #define vsrad_n_u64(__p0, __p1, __p2) __extension__ ({ \ 62946 uint64_t __ret; \ 62947 uint64_t __s0 = __p0; \ 62948 uint64_t __s1 = __p1; \ 62949 __ret = (uint64_t) __builtin_neon_vsrad_n_u64(__s0, __s1, __p2); \ 62950 __ret; \ 62951 }) 62952 #define vsrad_n_s64(__p0, __p1, __p2) __extension__ ({ \ 62953 int64_t __ret; \ 62954 int64_t __s0 = __p0; \ 62955 int64_t __s1 = __p1; \ 62956 __ret = (int64_t) 
__builtin_neon_vsrad_n_s64(__s0, __s1, __p2); \ 62957 __ret; \ 62958 }) 62959 #define vsrid_n_u64(__p0, __p1, __p2) __extension__ ({ \ 62960 uint64_t __ret; \ 62961 uint64_t __s0 = __p0; \ 62962 uint64_t __s1 = __p1; \ 62963 __ret = (uint64_t) __builtin_neon_vsrid_n_u64(__s0, __s1, __p2); \ 62964 __ret; \ 62965 }) 62966 #define vsrid_n_s64(__p0, __p1, __p2) __extension__ ({ \ 62967 int64_t __ret; \ 62968 int64_t __s0 = __p0; \ 62969 int64_t __s1 = __p1; \ 62970 __ret = (int64_t) __builtin_neon_vsrid_n_s64(__s0, __s1, __p2); \ 62971 __ret; \ 62972 }) 62973 #define vsri_n_p64(__p0, __p1, __p2) __extension__ ({ \ 62974 poly64x1_t __ret; \ 62975 poly64x1_t __s0 = __p0; \ 62976 poly64x1_t __s1 = __p1; \ 62977 __ret = (poly64x1_t) __builtin_neon_vsri_n_v((int8x8_t)__s0, (int8x8_t)__s1, __p2, 6); \ 62978 __ret; \ 62979 }) 62980 #ifdef __LITTLE_ENDIAN__ 62981 #define vsriq_n_p64(__p0, __p1, __p2) __extension__ ({ \ 62982 poly64x2_t __ret; \ 62983 poly64x2_t __s0 = __p0; \ 62984 poly64x2_t __s1 = __p1; \ 62985 __ret = (poly64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__s0, (int8x16_t)__s1, __p2, 38); \ 62986 __ret; \ 62987 }) 62988 #else 62989 #define vsriq_n_p64(__p0, __p1, __p2) __extension__ ({ \ 62990 poly64x2_t __ret; \ 62991 poly64x2_t __s0 = __p0; \ 62992 poly64x2_t __s1 = __p1; \ 62993 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 62994 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 62995 __ret = (poly64x2_t) __builtin_neon_vsriq_n_v((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 38); \ 62996 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 62997 __ret; \ 62998 }) 62999 #endif 63000 63001 #define vst1_p64(__p0, __p1) __extension__ ({ \ 63002 poly64x1_t __s1 = __p1; \ 63003 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 6); \ 63004 }) 63005 #ifdef __LITTLE_ENDIAN__ 63006 #define vst1q_p64(__p0, __p1) __extension__ ({ \ 63007 poly64x2_t __s1 = __p1; \ 63008 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 38); \ 63009 
}) 63010 #else 63011 #define vst1q_p64(__p0, __p1) __extension__ ({ \ 63012 poly64x2_t __s1 = __p1; \ 63013 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 63014 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 38); \ 63015 }) 63016 #endif 63017 63018 #ifdef __LITTLE_ENDIAN__ 63019 #define vst1q_f64(__p0, __p1) __extension__ ({ \ 63020 float64x2_t __s1 = __p1; \ 63021 __builtin_neon_vst1q_v(__p0, (int8x16_t)__s1, 42); \ 63022 }) 63023 #else 63024 #define vst1q_f64(__p0, __p1) __extension__ ({ \ 63025 float64x2_t __s1 = __p1; \ 63026 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 63027 __builtin_neon_vst1q_v(__p0, (int8x16_t)__rev1, 42); \ 63028 }) 63029 #endif 63030 63031 #define vst1_f64(__p0, __p1) __extension__ ({ \ 63032 float64x1_t __s1 = __p1; \ 63033 __builtin_neon_vst1_v(__p0, (int8x8_t)__s1, 10); \ 63034 }) 63035 #define vst1_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63036 poly64x1_t __s1 = __p1; \ 63037 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 6); \ 63038 }) 63039 #ifdef __LITTLE_ENDIAN__ 63040 #define vst1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63041 poly64x2_t __s1 = __p1; \ 63042 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 38); \ 63043 }) 63044 #else 63045 #define vst1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63046 poly64x2_t __s1 = __p1; \ 63047 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 63048 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__rev1, __p2, 38); \ 63049 }) 63050 #endif 63051 63052 #ifdef __LITTLE_ENDIAN__ 63053 #define vst1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63054 float64x2_t __s1 = __p1; \ 63055 __builtin_neon_vst1q_lane_v(__p0, (int8x16_t)__s1, __p2, 42); \ 63056 }) 63057 #else 63058 #define vst1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63059 float64x2_t __s1 = __p1; \ 63060 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 63061 __builtin_neon_vst1q_lane_v(__p0, 
(int8x16_t)__rev1, __p2, 42); \ 63062 }) 63063 #endif 63064 63065 #define vst1_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63066 float64x1_t __s1 = __p1; \ 63067 __builtin_neon_vst1_lane_v(__p0, (int8x8_t)__s1, __p2, 10); \ 63068 }) 63069 #define vst1_p64_x2(__p0, __p1) __extension__ ({ \ 63070 poly64x1x2_t __s1 = __p1; \ 63071 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 6); \ 63072 }) 63073 #ifdef __LITTLE_ENDIAN__ 63074 #define vst1q_p64_x2(__p0, __p1) __extension__ ({ \ 63075 poly64x2x2_t __s1 = __p1; \ 63076 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 38); \ 63077 }) 63078 #else 63079 #define vst1q_p64_x2(__p0, __p1) __extension__ ({ \ 63080 poly64x2x2_t __s1 = __p1; \ 63081 poly64x2x2_t __rev1; \ 63082 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63083 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63084 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 38); \ 63085 }) 63086 #endif 63087 63088 #ifdef __LITTLE_ENDIAN__ 63089 #define vst1q_f64_x2(__p0, __p1) __extension__ ({ \ 63090 float64x2x2_t __s1 = __p1; \ 63091 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 42); \ 63092 }) 63093 #else 63094 #define vst1q_f64_x2(__p0, __p1) __extension__ ({ \ 63095 float64x2x2_t __s1 = __p1; \ 63096 float64x2x2_t __rev1; \ 63097 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63098 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63099 __builtin_neon_vst1q_x2_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 42); \ 63100 }) 63101 #endif 63102 63103 #define vst1_f64_x2(__p0, __p1) __extension__ ({ \ 63104 float64x1x2_t __s1 = __p1; \ 63105 __builtin_neon_vst1_x2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 10); \ 63106 }) 63107 #define vst1_p64_x3(__p0, __p1) __extension__ ({ \ 63108 poly64x1x3_t __s1 = __p1; \ 
63109 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 6); \ 63110 }) 63111 #ifdef __LITTLE_ENDIAN__ 63112 #define vst1q_p64_x3(__p0, __p1) __extension__ ({ \ 63113 poly64x2x3_t __s1 = __p1; \ 63114 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 38); \ 63115 }) 63116 #else 63117 #define vst1q_p64_x3(__p0, __p1) __extension__ ({ \ 63118 poly64x2x3_t __s1 = __p1; \ 63119 poly64x2x3_t __rev1; \ 63120 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63121 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63122 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63123 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 38); \ 63124 }) 63125 #endif 63126 63127 #ifdef __LITTLE_ENDIAN__ 63128 #define vst1q_f64_x3(__p0, __p1) __extension__ ({ \ 63129 float64x2x3_t __s1 = __p1; \ 63130 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 42); \ 63131 }) 63132 #else 63133 #define vst1q_f64_x3(__p0, __p1) __extension__ ({ \ 63134 float64x2x3_t __s1 = __p1; \ 63135 float64x2x3_t __rev1; \ 63136 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63137 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63138 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63139 __builtin_neon_vst1q_x3_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 42); \ 63140 }) 63141 #endif 63142 63143 #define vst1_f64_x3(__p0, __p1) __extension__ ({ \ 63144 float64x1x3_t __s1 = __p1; \ 63145 __builtin_neon_vst1_x3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 10); \ 63146 }) 63147 #define vst1_p64_x4(__p0, __p1) __extension__ ({ \ 63148 poly64x1x4_t __s1 = __p1; \ 63149 
__builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 6); \ 63150 }) 63151 #ifdef __LITTLE_ENDIAN__ 63152 #define vst1q_p64_x4(__p0, __p1) __extension__ ({ \ 63153 poly64x2x4_t __s1 = __p1; \ 63154 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 38); \ 63155 }) 63156 #else 63157 #define vst1q_p64_x4(__p0, __p1) __extension__ ({ \ 63158 poly64x2x4_t __s1 = __p1; \ 63159 poly64x2x4_t __rev1; \ 63160 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63161 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63162 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63163 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63164 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 38); \ 63165 }) 63166 #endif 63167 63168 #ifdef __LITTLE_ENDIAN__ 63169 #define vst1q_f64_x4(__p0, __p1) __extension__ ({ \ 63170 float64x2x4_t __s1 = __p1; \ 63171 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 42); \ 63172 }) 63173 #else 63174 #define vst1q_f64_x4(__p0, __p1) __extension__ ({ \ 63175 float64x2x4_t __s1 = __p1; \ 63176 float64x2x4_t __rev1; \ 63177 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63178 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63179 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63180 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63181 __builtin_neon_vst1q_x4_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 42); \ 63182 }) 63183 #endif 63184 63185 #define vst1_f64_x4(__p0, __p1) 
__extension__ ({ \ 63186 float64x1x4_t __s1 = __p1; \ 63187 __builtin_neon_vst1_x4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 10); \ 63188 }) 63189 #define vst2_p64(__p0, __p1) __extension__ ({ \ 63190 poly64x1x2_t __s1 = __p1; \ 63191 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 6); \ 63192 }) 63193 #ifdef __LITTLE_ENDIAN__ 63194 #define vst2q_p64(__p0, __p1) __extension__ ({ \ 63195 poly64x2x2_t __s1 = __p1; \ 63196 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 38); \ 63197 }) 63198 #else 63199 #define vst2q_p64(__p0, __p1) __extension__ ({ \ 63200 poly64x2x2_t __s1 = __p1; \ 63201 poly64x2x2_t __rev1; \ 63202 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63203 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63204 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 38); \ 63205 }) 63206 #endif 63207 63208 #ifdef __LITTLE_ENDIAN__ 63209 #define vst2q_u64(__p0, __p1) __extension__ ({ \ 63210 uint64x2x2_t __s1 = __p1; \ 63211 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 51); \ 63212 }) 63213 #else 63214 #define vst2q_u64(__p0, __p1) __extension__ ({ \ 63215 uint64x2x2_t __s1 = __p1; \ 63216 uint64x2x2_t __rev1; \ 63217 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63218 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63219 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 51); \ 63220 }) 63221 #endif 63222 63223 #ifdef __LITTLE_ENDIAN__ 63224 #define vst2q_f64(__p0, __p1) __extension__ ({ \ 63225 float64x2x2_t __s1 = __p1; \ 63226 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 42); \ 63227 }) 63228 #else 63229 #define vst2q_f64(__p0, __p1) __extension__ ({ \ 63230 float64x2x2_t __s1 = __p1; \ 63231 float64x2x2_t __rev1; \ 
63232 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63233 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63234 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 42); \ 63235 }) 63236 #endif 63237 63238 #ifdef __LITTLE_ENDIAN__ 63239 #define vst2q_s64(__p0, __p1) __extension__ ({ \ 63240 int64x2x2_t __s1 = __p1; \ 63241 __builtin_neon_vst2q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 35); \ 63242 }) 63243 #else 63244 #define vst2q_s64(__p0, __p1) __extension__ ({ \ 63245 int64x2x2_t __s1 = __p1; \ 63246 int64x2x2_t __rev1; \ 63247 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63248 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63249 __builtin_neon_vst2q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], 35); \ 63250 }) 63251 #endif 63252 63253 #define vst2_f64(__p0, __p1) __extension__ ({ \ 63254 float64x1x2_t __s1 = __p1; \ 63255 __builtin_neon_vst2_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], 10); \ 63256 }) 63257 #define vst2_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63258 poly64x1x2_t __s1 = __p1; \ 63259 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 6); \ 63260 }) 63261 #ifdef __LITTLE_ENDIAN__ 63262 #define vst2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 63263 poly8x16x2_t __s1 = __p1; \ 63264 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 36); \ 63265 }) 63266 #else 63267 #define vst2q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 63268 poly8x16x2_t __s1 = __p1; \ 63269 poly8x16x2_t __rev1; \ 63270 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63271 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63272 __builtin_neon_vst2q_lane_v(__p0, 
(int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 36); \ 63273 }) 63274 #endif 63275 63276 #ifdef __LITTLE_ENDIAN__ 63277 #define vst2q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63278 poly64x2x2_t __s1 = __p1; \ 63279 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 38); \ 63280 }) 63281 #else 63282 #define vst2q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63283 poly64x2x2_t __s1 = __p1; \ 63284 poly64x2x2_t __rev1; \ 63285 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63286 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63287 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 38); \ 63288 }) 63289 #endif 63290 63291 #ifdef __LITTLE_ENDIAN__ 63292 #define vst2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 63293 uint8x16x2_t __s1 = __p1; \ 63294 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 48); \ 63295 }) 63296 #else 63297 #define vst2q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 63298 uint8x16x2_t __s1 = __p1; \ 63299 uint8x16x2_t __rev1; \ 63300 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63301 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63302 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 48); \ 63303 }) 63304 #endif 63305 63306 #ifdef __LITTLE_ENDIAN__ 63307 #define vst2q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63308 uint64x2x2_t __s1 = __p1; \ 63309 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 51); \ 63310 }) 63311 #else 63312 #define vst2q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63313 uint64x2x2_t __s1 = __p1; \ 63314 uint64x2x2_t __rev1; \ 63315 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 
0); \ 63316 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63317 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 51); \ 63318 }) 63319 #endif 63320 63321 #ifdef __LITTLE_ENDIAN__ 63322 #define vst2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 63323 int8x16x2_t __s1 = __p1; \ 63324 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 32); \ 63325 }) 63326 #else 63327 #define vst2q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 63328 int8x16x2_t __s1 = __p1; \ 63329 int8x16x2_t __rev1; \ 63330 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63331 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63332 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 32); \ 63333 }) 63334 #endif 63335 63336 #ifdef __LITTLE_ENDIAN__ 63337 #define vst2q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63338 float64x2x2_t __s1 = __p1; \ 63339 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 42); \ 63340 }) 63341 #else 63342 #define vst2q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63343 float64x2x2_t __s1 = __p1; \ 63344 float64x2x2_t __rev1; \ 63345 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63346 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63347 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 42); \ 63348 }) 63349 #endif 63350 63351 #ifdef __LITTLE_ENDIAN__ 63352 #define vst2q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63353 int64x2x2_t __s1 = __p1; \ 63354 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], __p2, 35); \ 63355 }) 63356 #else 63357 #define vst2q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63358 
int64x2x2_t __s1 = __p1; \ 63359 int64x2x2_t __rev1; \ 63360 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63361 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63362 __builtin_neon_vst2q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], __p2, 35); \ 63363 }) 63364 #endif 63365 63366 #define vst2_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63367 uint64x1x2_t __s1 = __p1; \ 63368 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 19); \ 63369 }) 63370 #define vst2_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63371 float64x1x2_t __s1 = __p1; \ 63372 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 10); \ 63373 }) 63374 #define vst2_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63375 int64x1x2_t __s1 = __p1; \ 63376 __builtin_neon_vst2_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], __p2, 3); \ 63377 }) 63378 #define vst3_p64(__p0, __p1) __extension__ ({ \ 63379 poly64x1x3_t __s1 = __p1; \ 63380 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 6); \ 63381 }) 63382 #ifdef __LITTLE_ENDIAN__ 63383 #define vst3q_p64(__p0, __p1) __extension__ ({ \ 63384 poly64x2x3_t __s1 = __p1; \ 63385 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 38); \ 63386 }) 63387 #else 63388 #define vst3q_p64(__p0, __p1) __extension__ ({ \ 63389 poly64x2x3_t __s1 = __p1; \ 63390 poly64x2x3_t __rev1; \ 63391 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63392 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63393 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63394 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 38); \ 63395 }) 63396 #endif 63397 63398 #ifdef __LITTLE_ENDIAN__ 63399 #define vst3q_u64(__p0, 
__p1) __extension__ ({ \ 63400 uint64x2x3_t __s1 = __p1; \ 63401 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 51); \ 63402 }) 63403 #else 63404 #define vst3q_u64(__p0, __p1) __extension__ ({ \ 63405 uint64x2x3_t __s1 = __p1; \ 63406 uint64x2x3_t __rev1; \ 63407 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63408 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63409 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63410 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 51); \ 63411 }) 63412 #endif 63413 63414 #ifdef __LITTLE_ENDIAN__ 63415 #define vst3q_f64(__p0, __p1) __extension__ ({ \ 63416 float64x2x3_t __s1 = __p1; \ 63417 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 42); \ 63418 }) 63419 #else 63420 #define vst3q_f64(__p0, __p1) __extension__ ({ \ 63421 float64x2x3_t __s1 = __p1; \ 63422 float64x2x3_t __rev1; \ 63423 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63424 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63425 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63426 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 42); \ 63427 }) 63428 #endif 63429 63430 #ifdef __LITTLE_ENDIAN__ 63431 #define vst3q_s64(__p0, __p1) __extension__ ({ \ 63432 int64x2x3_t __s1 = __p1; \ 63433 __builtin_neon_vst3q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], 35); \ 63434 }) 63435 #else 63436 #define vst3q_s64(__p0, __p1) __extension__ ({ \ 63437 int64x2x3_t __s1 = __p1; \ 63438 int64x2x3_t __rev1; \ 63439 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63440 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); 
\ 63441 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63442 __builtin_neon_vst3q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], 35); \ 63443 }) 63444 #endif 63445 63446 #define vst3_f64(__p0, __p1) __extension__ ({ \ 63447 float64x1x3_t __s1 = __p1; \ 63448 __builtin_neon_vst3_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], 10); \ 63449 }) 63450 #define vst3_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63451 poly64x1x3_t __s1 = __p1; \ 63452 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 6); \ 63453 }) 63454 #ifdef __LITTLE_ENDIAN__ 63455 #define vst3q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 63456 poly8x16x3_t __s1 = __p1; \ 63457 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 36); \ 63458 }) 63459 #else 63460 #define vst3q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 63461 poly8x16x3_t __s1 = __p1; \ 63462 poly8x16x3_t __rev1; \ 63463 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63464 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63465 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63466 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 36); \ 63467 }) 63468 #endif 63469 63470 #ifdef __LITTLE_ENDIAN__ 63471 #define vst3q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63472 poly64x2x3_t __s1 = __p1; \ 63473 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 38); \ 63474 }) 63475 #else 63476 #define vst3q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63477 poly64x2x3_t __s1 = __p1; \ 63478 
poly64x2x3_t __rev1; \ 63479 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63480 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63481 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63482 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 38); \ 63483 }) 63484 #endif 63485 63486 #ifdef __LITTLE_ENDIAN__ 63487 #define vst3q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 63488 uint8x16x3_t __s1 = __p1; \ 63489 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 48); \ 63490 }) 63491 #else 63492 #define vst3q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 63493 uint8x16x3_t __s1 = __p1; \ 63494 uint8x16x3_t __rev1; \ 63495 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63496 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63497 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63498 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 48); \ 63499 }) 63500 #endif 63501 63502 #ifdef __LITTLE_ENDIAN__ 63503 #define vst3q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63504 uint64x2x3_t __s1 = __p1; \ 63505 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 51); \ 63506 }) 63507 #else 63508 #define vst3q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63509 uint64x2x3_t __s1 = __p1; \ 63510 uint64x2x3_t __rev1; \ 63511 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63512 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63513 __rev1.val[2] = 
__builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63514 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 51); \ 63515 }) 63516 #endif 63517 63518 #ifdef __LITTLE_ENDIAN__ 63519 #define vst3q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 63520 int8x16x3_t __s1 = __p1; \ 63521 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 32); \ 63522 }) 63523 #else 63524 #define vst3q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 63525 int8x16x3_t __s1 = __p1; \ 63526 int8x16x3_t __rev1; \ 63527 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63528 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63529 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63530 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 32); \ 63531 }) 63532 #endif 63533 63534 #ifdef __LITTLE_ENDIAN__ 63535 #define vst3q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63536 float64x2x3_t __s1 = __p1; \ 63537 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 42); \ 63538 }) 63539 #else 63540 #define vst3q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63541 float64x2x3_t __s1 = __p1; \ 63542 float64x2x3_t __rev1; \ 63543 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63544 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63545 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63546 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 42); \ 63547 }) 63548 #endif 63549 63550 #ifdef 
__LITTLE_ENDIAN__ 63551 #define vst3q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63552 int64x2x3_t __s1 = __p1; \ 63553 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], __p2, 35); \ 63554 }) 63555 #else 63556 #define vst3q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63557 int64x2x3_t __s1 = __p1; \ 63558 int64x2x3_t __rev1; \ 63559 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63560 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63561 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63562 __builtin_neon_vst3q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], __p2, 35); \ 63563 }) 63564 #endif 63565 63566 #define vst3_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63567 uint64x1x3_t __s1 = __p1; \ 63568 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 19); \ 63569 }) 63570 #define vst3_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63571 float64x1x3_t __s1 = __p1; \ 63572 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 10); \ 63573 }) 63574 #define vst3_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63575 int64x1x3_t __s1 = __p1; \ 63576 __builtin_neon_vst3_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], __p2, 3); \ 63577 }) 63578 #define vst4_p64(__p0, __p1) __extension__ ({ \ 63579 poly64x1x4_t __s1 = __p1; \ 63580 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 6); \ 63581 }) 63582 #ifdef __LITTLE_ENDIAN__ 63583 #define vst4q_p64(__p0, __p1) __extension__ ({ \ 63584 poly64x2x4_t __s1 = __p1; \ 63585 __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 38); \ 63586 }) 63587 #else 63588 #define 
vst4q_p64(__p0, __p1) __extension__ ({ \ 63589 poly64x2x4_t __s1 = __p1; \ 63590 poly64x2x4_t __rev1; \ 63591 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63592 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63593 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63594 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63595 __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 38); \ 63596 }) 63597 #endif 63598 63599 #ifdef __LITTLE_ENDIAN__ 63600 #define vst4q_u64(__p0, __p1) __extension__ ({ \ 63601 uint64x2x4_t __s1 = __p1; \ 63602 __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 51); \ 63603 }) 63604 #else 63605 #define vst4q_u64(__p0, __p1) __extension__ ({ \ 63606 uint64x2x4_t __s1 = __p1; \ 63607 uint64x2x4_t __rev1; \ 63608 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63609 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63610 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63611 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63612 __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 51); \ 63613 }) 63614 #endif 63615 63616 #ifdef __LITTLE_ENDIAN__ 63617 #define vst4q_f64(__p0, __p1) __extension__ ({ \ 63618 float64x2x4_t __s1 = __p1; \ 63619 __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 42); \ 63620 }) 63621 #else 63622 #define vst4q_f64(__p0, __p1) __extension__ ({ \ 63623 float64x2x4_t __s1 = __p1; \ 63624 float64x2x4_t __rev1; \ 63625 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63626 __rev1.val[1] = 
__builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63627 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63628 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63629 __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 42); \ 63630 }) 63631 #endif 63632 63633 #ifdef __LITTLE_ENDIAN__ 63634 #define vst4q_s64(__p0, __p1) __extension__ ({ \ 63635 int64x2x4_t __s1 = __p1; \ 63636 __builtin_neon_vst4q_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], 35); \ 63637 }) 63638 #else 63639 #define vst4q_s64(__p0, __p1) __extension__ ({ \ 63640 int64x2x4_t __s1 = __p1; \ 63641 int64x2x4_t __rev1; \ 63642 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63643 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63644 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63645 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63646 __builtin_neon_vst4q_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], 35); \ 63647 }) 63648 #endif 63649 63650 #define vst4_f64(__p0, __p1) __extension__ ({ \ 63651 float64x1x4_t __s1 = __p1; \ 63652 __builtin_neon_vst4_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], 10); \ 63653 }) 63654 #define vst4_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63655 poly64x1x4_t __s1 = __p1; \ 63656 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 6); \ 63657 }) 63658 #ifdef __LITTLE_ENDIAN__ 63659 #define vst4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 63660 poly8x16x4_t __s1 = __p1; \ 63661 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], 
(int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 36); \ 63662 }) 63663 #else 63664 #define vst4q_lane_p8(__p0, __p1, __p2) __extension__ ({ \ 63665 poly8x16x4_t __s1 = __p1; \ 63666 poly8x16x4_t __rev1; \ 63667 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63668 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63669 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63670 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63671 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 36); \ 63672 }) 63673 #endif 63674 63675 #ifdef __LITTLE_ENDIAN__ 63676 #define vst4q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63677 poly64x2x4_t __s1 = __p1; \ 63678 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 38); \ 63679 }) 63680 #else 63681 #define vst4q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 63682 poly64x2x4_t __s1 = __p1; \ 63683 poly64x2x4_t __rev1; \ 63684 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63685 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63686 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63687 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63688 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 38); \ 63689 }) 63690 #endif 63691 63692 #ifdef __LITTLE_ENDIAN__ 63693 #define vst4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 63694 uint8x16x4_t __s1 = __p1; \ 63695 
__builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 48); \ 63696 }) 63697 #else 63698 #define vst4q_lane_u8(__p0, __p1, __p2) __extension__ ({ \ 63699 uint8x16x4_t __s1 = __p1; \ 63700 uint8x16x4_t __rev1; \ 63701 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63702 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63703 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63704 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63705 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 48); \ 63706 }) 63707 #endif 63708 63709 #ifdef __LITTLE_ENDIAN__ 63710 #define vst4q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63711 uint64x2x4_t __s1 = __p1; \ 63712 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 51); \ 63713 }) 63714 #else 63715 #define vst4q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63716 uint64x2x4_t __s1 = __p1; \ 63717 uint64x2x4_t __rev1; \ 63718 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63719 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63720 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63721 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63722 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 51); \ 63723 }) 63724 #endif 63725 63726 #ifdef __LITTLE_ENDIAN__ 63727 #define vst4q_lane_s8(__p0, 
__p1, __p2) __extension__ ({ \ 63728 int8x16x4_t __s1 = __p1; \ 63729 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 32); \ 63730 }) 63731 #else 63732 #define vst4q_lane_s8(__p0, __p1, __p2) __extension__ ({ \ 63733 int8x16x4_t __s1 = __p1; \ 63734 int8x16x4_t __rev1; \ 63735 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63736 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63737 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63738 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 63739 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 32); \ 63740 }) 63741 #endif 63742 63743 #ifdef __LITTLE_ENDIAN__ 63744 #define vst4q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63745 float64x2x4_t __s1 = __p1; \ 63746 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 42); \ 63747 }) 63748 #else 63749 #define vst4q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63750 float64x2x4_t __s1 = __p1; \ 63751 float64x2x4_t __rev1; \ 63752 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63753 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63754 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63755 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63756 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 42); \ 63757 }) 63758 #endif 
63759 63760 #ifdef __LITTLE_ENDIAN__ 63761 #define vst4q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63762 int64x2x4_t __s1 = __p1; \ 63763 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__s1.val[0], (int8x16_t)__s1.val[1], (int8x16_t)__s1.val[2], (int8x16_t)__s1.val[3], __p2, 35); \ 63764 }) 63765 #else 63766 #define vst4q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63767 int64x2x4_t __s1 = __p1; \ 63768 int64x2x4_t __rev1; \ 63769 __rev1.val[0] = __builtin_shufflevector(__s1.val[0], __s1.val[0], 1, 0); \ 63770 __rev1.val[1] = __builtin_shufflevector(__s1.val[1], __s1.val[1], 1, 0); \ 63771 __rev1.val[2] = __builtin_shufflevector(__s1.val[2], __s1.val[2], 1, 0); \ 63772 __rev1.val[3] = __builtin_shufflevector(__s1.val[3], __s1.val[3], 1, 0); \ 63773 __builtin_neon_vst4q_lane_v(__p0, (int8x16_t)__rev1.val[0], (int8x16_t)__rev1.val[1], (int8x16_t)__rev1.val[2], (int8x16_t)__rev1.val[3], __p2, 35); \ 63774 }) 63775 #endif 63776 63777 #define vst4_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 63778 uint64x1x4_t __s1 = __p1; \ 63779 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 19); \ 63780 }) 63781 #define vst4_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 63782 float64x1x4_t __s1 = __p1; \ 63783 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 10); \ 63784 }) 63785 #define vst4_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 63786 int64x1x4_t __s1 = __p1; \ 63787 __builtin_neon_vst4_lane_v(__p0, (int8x8_t)__s1.val[0], (int8x8_t)__s1.val[1], (int8x8_t)__s1.val[2], (int8x8_t)__s1.val[3], __p2, 3); \ 63788 }) 63789 #define vstrq_p128(__p0, __p1) __extension__ ({ \ 63790 poly128_t __s1 = __p1; \ 63791 __builtin_neon_vstrq_p128(__p0, __s1); \ 63792 }) 63793 __ai __attribute__((target("neon"))) uint64_t vsubd_u64(uint64_t __p0, uint64_t __p1) { 63794 uint64_t __ret; 63795 __ret = (uint64_t) 
__builtin_neon_vsubd_u64(__p0, __p1); 63796 return __ret; 63797 } 63798 __ai __attribute__((target("neon"))) int64_t vsubd_s64(int64_t __p0, int64_t __p1) { 63799 int64_t __ret; 63800 __ret = (int64_t) __builtin_neon_vsubd_s64(__p0, __p1); 63801 return __ret; 63802 } 63803 #ifdef __LITTLE_ENDIAN__ 63804 __ai __attribute__((target("neon"))) float64x2_t vsubq_f64(float64x2_t __p0, float64x2_t __p1) { 63805 float64x2_t __ret; 63806 __ret = __p0 - __p1; 63807 return __ret; 63808 } 63809 #else 63810 __ai __attribute__((target("neon"))) float64x2_t vsubq_f64(float64x2_t __p0, float64x2_t __p1) { 63811 float64x2_t __ret; 63812 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 63813 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 63814 __ret = __rev0 - __rev1; 63815 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 63816 return __ret; 63817 } 63818 #endif 63819 63820 __ai __attribute__((target("neon"))) float64x1_t vsub_f64(float64x1_t __p0, float64x1_t __p1) { 63821 float64x1_t __ret; 63822 __ret = __p0 - __p1; 63823 return __ret; 63824 } 63825 #ifdef __LITTLE_ENDIAN__ 63826 __ai __attribute__((target("neon"))) uint16x8_t vsubhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 63827 uint16x8_t __ret; 63828 __ret = vcombine_u16(__p0, vsubhn_u32(__p1, __p2)); 63829 return __ret; 63830 } 63831 #else 63832 __ai __attribute__((target("neon"))) uint16x8_t vsubhn_high_u32(uint16x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 63833 uint16x8_t __ret; 63834 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 63835 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 63836 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 63837 __ret = __noswap_vcombine_u16(__rev0, __noswap_vsubhn_u32(__rev1, __rev2)); 63838 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 63839 return __ret; 63840 } 63841 #endif 63842 63843 #ifdef 
__LITTLE_ENDIAN__ 63844 __ai __attribute__((target("neon"))) uint32x4_t vsubhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 63845 uint32x4_t __ret; 63846 __ret = vcombine_u32(__p0, vsubhn_u64(__p1, __p2)); 63847 return __ret; 63848 } 63849 #else 63850 __ai __attribute__((target("neon"))) uint32x4_t vsubhn_high_u64(uint32x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 63851 uint32x4_t __ret; 63852 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 63853 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 63854 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 63855 __ret = __noswap_vcombine_u32(__rev0, __noswap_vsubhn_u64(__rev1, __rev2)); 63856 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 63857 return __ret; 63858 } 63859 #endif 63860 63861 #ifdef __LITTLE_ENDIAN__ 63862 __ai __attribute__((target("neon"))) uint8x16_t vsubhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 63863 uint8x16_t __ret; 63864 __ret = vcombine_u8(__p0, vsubhn_u16(__p1, __p2)); 63865 return __ret; 63866 } 63867 #else 63868 __ai __attribute__((target("neon"))) uint8x16_t vsubhn_high_u16(uint8x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 63869 uint8x16_t __ret; 63870 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 63871 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 63872 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 63873 __ret = __noswap_vcombine_u8(__rev0, __noswap_vsubhn_u16(__rev1, __rev2)); 63874 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 63875 return __ret; 63876 } 63877 #endif 63878 63879 #ifdef __LITTLE_ENDIAN__ 63880 __ai __attribute__((target("neon"))) int16x8_t vsubhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 63881 int16x8_t __ret; 63882 __ret = vcombine_s16(__p0, vsubhn_s32(__p1, 
__p2)); 63883 return __ret; 63884 } 63885 #else 63886 __ai __attribute__((target("neon"))) int16x8_t vsubhn_high_s32(int16x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 63887 int16x8_t __ret; 63888 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 63889 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 63890 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 63891 __ret = __noswap_vcombine_s16(__rev0, __noswap_vsubhn_s32(__rev1, __rev2)); 63892 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 63893 return __ret; 63894 } 63895 #endif 63896 63897 #ifdef __LITTLE_ENDIAN__ 63898 __ai __attribute__((target("neon"))) int32x4_t vsubhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 63899 int32x4_t __ret; 63900 __ret = vcombine_s32(__p0, vsubhn_s64(__p1, __p2)); 63901 return __ret; 63902 } 63903 #else 63904 __ai __attribute__((target("neon"))) int32x4_t vsubhn_high_s64(int32x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 63905 int32x4_t __ret; 63906 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 63907 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 63908 int64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 63909 __ret = __noswap_vcombine_s32(__rev0, __noswap_vsubhn_s64(__rev1, __rev2)); 63910 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 63911 return __ret; 63912 } 63913 #endif 63914 63915 #ifdef __LITTLE_ENDIAN__ 63916 __ai __attribute__((target("neon"))) int8x16_t vsubhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 63917 int8x16_t __ret; 63918 __ret = vcombine_s8(__p0, vsubhn_s16(__p1, __p2)); 63919 return __ret; 63920 } 63921 #else 63922 __ai __attribute__((target("neon"))) int8x16_t vsubhn_high_s16(int8x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 63923 int8x16_t __ret; 63924 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 63925 int16x8_t 
__rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 63926 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 63927 __ret = __noswap_vcombine_s8(__rev0, __noswap_vsubhn_s16(__rev1, __rev2)); 63928 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 63929 return __ret; 63930 } 63931 #endif 63932 63933 #ifdef __LITTLE_ENDIAN__ 63934 __ai __attribute__((target("neon"))) uint16x8_t vsubl_high_u8(uint8x16_t __p0, uint8x16_t __p1) { 63935 uint16x8_t __ret; 63936 __ret = vmovl_high_u8(__p0) - vmovl_high_u8(__p1); 63937 return __ret; 63938 } 63939 #else 63940 __ai __attribute__((target("neon"))) uint16x8_t vsubl_high_u8(uint8x16_t __p0, uint8x16_t __p1) { 63941 uint16x8_t __ret; 63942 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 63943 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 63944 __ret = __noswap_vmovl_high_u8(__rev0) - __noswap_vmovl_high_u8(__rev1); 63945 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 63946 return __ret; 63947 } 63948 #endif 63949 63950 #ifdef __LITTLE_ENDIAN__ 63951 __ai __attribute__((target("neon"))) uint64x2_t vsubl_high_u32(uint32x4_t __p0, uint32x4_t __p1) { 63952 uint64x2_t __ret; 63953 __ret = vmovl_high_u32(__p0) - vmovl_high_u32(__p1); 63954 return __ret; 63955 } 63956 #else 63957 __ai __attribute__((target("neon"))) uint64x2_t vsubl_high_u32(uint32x4_t __p0, uint32x4_t __p1) { 63958 uint64x2_t __ret; 63959 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 63960 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 63961 __ret = __noswap_vmovl_high_u32(__rev0) - __noswap_vmovl_high_u32(__rev1); 63962 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 63963 return __ret; 63964 } 63965 #endif 63966 63967 #ifdef 
__LITTLE_ENDIAN__ 63968 __ai __attribute__((target("neon"))) uint32x4_t vsubl_high_u16(uint16x8_t __p0, uint16x8_t __p1) { 63969 uint32x4_t __ret; 63970 __ret = vmovl_high_u16(__p0) - vmovl_high_u16(__p1); 63971 return __ret; 63972 } 63973 #else 63974 __ai __attribute__((target("neon"))) uint32x4_t vsubl_high_u16(uint16x8_t __p0, uint16x8_t __p1) { 63975 uint32x4_t __ret; 63976 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 63977 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 63978 __ret = __noswap_vmovl_high_u16(__rev0) - __noswap_vmovl_high_u16(__rev1); 63979 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 63980 return __ret; 63981 } 63982 #endif 63983 63984 #ifdef __LITTLE_ENDIAN__ 63985 __ai __attribute__((target("neon"))) int16x8_t vsubl_high_s8(int8x16_t __p0, int8x16_t __p1) { 63986 int16x8_t __ret; 63987 __ret = vmovl_high_s8(__p0) - vmovl_high_s8(__p1); 63988 return __ret; 63989 } 63990 #else 63991 __ai __attribute__((target("neon"))) int16x8_t vsubl_high_s8(int8x16_t __p0, int8x16_t __p1) { 63992 int16x8_t __ret; 63993 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 63994 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 63995 __ret = __noswap_vmovl_high_s8(__rev0) - __noswap_vmovl_high_s8(__rev1); 63996 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 63997 return __ret; 63998 } 63999 #endif 64000 64001 #ifdef __LITTLE_ENDIAN__ 64002 __ai __attribute__((target("neon"))) int64x2_t vsubl_high_s32(int32x4_t __p0, int32x4_t __p1) { 64003 int64x2_t __ret; 64004 __ret = vmovl_high_s32(__p0) - vmovl_high_s32(__p1); 64005 return __ret; 64006 } 64007 #else 64008 __ai __attribute__((target("neon"))) int64x2_t vsubl_high_s32(int32x4_t __p0, int32x4_t __p1) { 64009 int64x2_t __ret; 64010 int32x4_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64011 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64012 __ret = __noswap_vmovl_high_s32(__rev0) - __noswap_vmovl_high_s32(__rev1); 64013 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64014 return __ret; 64015 } 64016 #endif 64017 64018 #ifdef __LITTLE_ENDIAN__ 64019 __ai __attribute__((target("neon"))) int32x4_t vsubl_high_s16(int16x8_t __p0, int16x8_t __p1) { 64020 int32x4_t __ret; 64021 __ret = vmovl_high_s16(__p0) - vmovl_high_s16(__p1); 64022 return __ret; 64023 } 64024 #else 64025 __ai __attribute__((target("neon"))) int32x4_t vsubl_high_s16(int16x8_t __p0, int16x8_t __p1) { 64026 int32x4_t __ret; 64027 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64028 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64029 __ret = __noswap_vmovl_high_s16(__rev0) - __noswap_vmovl_high_s16(__rev1); 64030 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64031 return __ret; 64032 } 64033 #endif 64034 64035 #ifdef __LITTLE_ENDIAN__ 64036 __ai __attribute__((target("neon"))) uint16x8_t vsubw_high_u8(uint16x8_t __p0, uint8x16_t __p1) { 64037 uint16x8_t __ret; 64038 __ret = __p0 - vmovl_high_u8(__p1); 64039 return __ret; 64040 } 64041 #else 64042 __ai __attribute__((target("neon"))) uint16x8_t vsubw_high_u8(uint16x8_t __p0, uint8x16_t __p1) { 64043 uint16x8_t __ret; 64044 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64045 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64046 __ret = __rev0 - __noswap_vmovl_high_u8(__rev1); 64047 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64048 return __ret; 64049 } 64050 #endif 64051 64052 #ifdef __LITTLE_ENDIAN__ 64053 __ai __attribute__((target("neon"))) uint64x2_t vsubw_high_u32(uint64x2_t __p0, uint32x4_t __p1) { 64054 uint64x2_t 
__ret; 64055 __ret = __p0 - vmovl_high_u32(__p1); 64056 return __ret; 64057 } 64058 #else 64059 __ai __attribute__((target("neon"))) uint64x2_t vsubw_high_u32(uint64x2_t __p0, uint32x4_t __p1) { 64060 uint64x2_t __ret; 64061 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64062 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64063 __ret = __rev0 - __noswap_vmovl_high_u32(__rev1); 64064 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64065 return __ret; 64066 } 64067 #endif 64068 64069 #ifdef __LITTLE_ENDIAN__ 64070 __ai __attribute__((target("neon"))) uint32x4_t vsubw_high_u16(uint32x4_t __p0, uint16x8_t __p1) { 64071 uint32x4_t __ret; 64072 __ret = __p0 - vmovl_high_u16(__p1); 64073 return __ret; 64074 } 64075 #else 64076 __ai __attribute__((target("neon"))) uint32x4_t vsubw_high_u16(uint32x4_t __p0, uint16x8_t __p1) { 64077 uint32x4_t __ret; 64078 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64079 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64080 __ret = __rev0 - __noswap_vmovl_high_u16(__rev1); 64081 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64082 return __ret; 64083 } 64084 #endif 64085 64086 #ifdef __LITTLE_ENDIAN__ 64087 __ai __attribute__((target("neon"))) int16x8_t vsubw_high_s8(int16x8_t __p0, int8x16_t __p1) { 64088 int16x8_t __ret; 64089 __ret = __p0 - vmovl_high_s8(__p1); 64090 return __ret; 64091 } 64092 #else 64093 __ai __attribute__((target("neon"))) int16x8_t vsubw_high_s8(int16x8_t __p0, int8x16_t __p1) { 64094 int16x8_t __ret; 64095 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64096 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64097 __ret = __rev0 - __noswap_vmovl_high_s8(__rev1); 64098 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64099 return __ret; 64100 } 
64101 #endif 64102 64103 #ifdef __LITTLE_ENDIAN__ 64104 __ai __attribute__((target("neon"))) int64x2_t vsubw_high_s32(int64x2_t __p0, int32x4_t __p1) { 64105 int64x2_t __ret; 64106 __ret = __p0 - vmovl_high_s32(__p1); 64107 return __ret; 64108 } 64109 #else 64110 __ai __attribute__((target("neon"))) int64x2_t vsubw_high_s32(int64x2_t __p0, int32x4_t __p1) { 64111 int64x2_t __ret; 64112 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64113 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64114 __ret = __rev0 - __noswap_vmovl_high_s32(__rev1); 64115 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64116 return __ret; 64117 } 64118 #endif 64119 64120 #ifdef __LITTLE_ENDIAN__ 64121 __ai __attribute__((target("neon"))) int32x4_t vsubw_high_s16(int32x4_t __p0, int16x8_t __p1) { 64122 int32x4_t __ret; 64123 __ret = __p0 - vmovl_high_s16(__p1); 64124 return __ret; 64125 } 64126 #else 64127 __ai __attribute__((target("neon"))) int32x4_t vsubw_high_s16(int32x4_t __p0, int16x8_t __p1) { 64128 int32x4_t __ret; 64129 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64130 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64131 __ret = __rev0 - __noswap_vmovl_high_s16(__rev1); 64132 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64133 return __ret; 64134 } 64135 #endif 64136 64137 #ifdef __LITTLE_ENDIAN__ 64138 __ai __attribute__((target("neon"))) poly8x8_t vtrn1_p8(poly8x8_t __p0, poly8x8_t __p1) { 64139 poly8x8_t __ret; 64140 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14); 64141 return __ret; 64142 } 64143 #else 64144 __ai __attribute__((target("neon"))) poly8x8_t vtrn1_p8(poly8x8_t __p0, poly8x8_t __p1) { 64145 poly8x8_t __ret; 64146 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64147 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64148 __ret = 
__builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14); 64149 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64150 return __ret; 64151 } 64152 #endif 64153 64154 #ifdef __LITTLE_ENDIAN__ 64155 __ai __attribute__((target("neon"))) poly16x4_t vtrn1_p16(poly16x4_t __p0, poly16x4_t __p1) { 64156 poly16x4_t __ret; 64157 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6); 64158 return __ret; 64159 } 64160 #else 64161 __ai __attribute__((target("neon"))) poly16x4_t vtrn1_p16(poly16x4_t __p0, poly16x4_t __p1) { 64162 poly16x4_t __ret; 64163 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64164 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64165 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6); 64166 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64167 return __ret; 64168 } 64169 #endif 64170 64171 #ifdef __LITTLE_ENDIAN__ 64172 __ai __attribute__((target("neon"))) poly8x16_t vtrn1q_p8(poly8x16_t __p0, poly8x16_t __p1) { 64173 poly8x16_t __ret; 64174 __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30); 64175 return __ret; 64176 } 64177 #else 64178 __ai __attribute__((target("neon"))) poly8x16_t vtrn1q_p8(poly8x16_t __p0, poly8x16_t __p1) { 64179 poly8x16_t __ret; 64180 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64181 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64182 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30); 64183 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64184 return __ret; 64185 } 64186 #endif 64187 64188 #ifdef __LITTLE_ENDIAN__ 64189 __ai __attribute__((target("neon"))) poly64x2_t vtrn1q_p64(poly64x2_t __p0, poly64x2_t __p1) { 
64190 poly64x2_t __ret; 64191 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 64192 return __ret; 64193 } 64194 #else 64195 __ai __attribute__((target("neon"))) poly64x2_t vtrn1q_p64(poly64x2_t __p0, poly64x2_t __p1) { 64196 poly64x2_t __ret; 64197 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64198 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64199 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 64200 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64201 return __ret; 64202 } 64203 #endif 64204 64205 #ifdef __LITTLE_ENDIAN__ 64206 __ai __attribute__((target("neon"))) poly16x8_t vtrn1q_p16(poly16x8_t __p0, poly16x8_t __p1) { 64207 poly16x8_t __ret; 64208 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14); 64209 return __ret; 64210 } 64211 #else 64212 __ai __attribute__((target("neon"))) poly16x8_t vtrn1q_p16(poly16x8_t __p0, poly16x8_t __p1) { 64213 poly16x8_t __ret; 64214 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64215 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64216 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14); 64217 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64218 return __ret; 64219 } 64220 #endif 64221 64222 #ifdef __LITTLE_ENDIAN__ 64223 __ai __attribute__((target("neon"))) uint8x16_t vtrn1q_u8(uint8x16_t __p0, uint8x16_t __p1) { 64224 uint8x16_t __ret; 64225 __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30); 64226 return __ret; 64227 } 64228 #else 64229 __ai __attribute__((target("neon"))) uint8x16_t vtrn1q_u8(uint8x16_t __p0, uint8x16_t __p1) { 64230 uint8x16_t __ret; 64231 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64232 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 
12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64233 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30); 64234 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64235 return __ret; 64236 } 64237 #endif 64238 64239 #ifdef __LITTLE_ENDIAN__ 64240 __ai __attribute__((target("neon"))) uint32x4_t vtrn1q_u32(uint32x4_t __p0, uint32x4_t __p1) { 64241 uint32x4_t __ret; 64242 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6); 64243 return __ret; 64244 } 64245 #else 64246 __ai __attribute__((target("neon"))) uint32x4_t vtrn1q_u32(uint32x4_t __p0, uint32x4_t __p1) { 64247 uint32x4_t __ret; 64248 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64249 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64250 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6); 64251 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64252 return __ret; 64253 } 64254 #endif 64255 64256 #ifdef __LITTLE_ENDIAN__ 64257 __ai __attribute__((target("neon"))) uint64x2_t vtrn1q_u64(uint64x2_t __p0, uint64x2_t __p1) { 64258 uint64x2_t __ret; 64259 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 64260 return __ret; 64261 } 64262 #else 64263 __ai __attribute__((target("neon"))) uint64x2_t vtrn1q_u64(uint64x2_t __p0, uint64x2_t __p1) { 64264 uint64x2_t __ret; 64265 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64266 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64267 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 64268 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64269 return __ret; 64270 } 64271 #endif 64272 64273 #ifdef __LITTLE_ENDIAN__ 64274 __ai __attribute__((target("neon"))) uint16x8_t vtrn1q_u16(uint16x8_t __p0, uint16x8_t __p1) { 64275 uint16x8_t __ret; 64276 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14); 64277 return __ret; 64278 
} 64279 #else 64280 __ai __attribute__((target("neon"))) uint16x8_t vtrn1q_u16(uint16x8_t __p0, uint16x8_t __p1) { 64281 uint16x8_t __ret; 64282 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64283 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64284 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14); 64285 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64286 return __ret; 64287 } 64288 #endif 64289 64290 #ifdef __LITTLE_ENDIAN__ 64291 __ai __attribute__((target("neon"))) int8x16_t vtrn1q_s8(int8x16_t __p0, int8x16_t __p1) { 64292 int8x16_t __ret; 64293 __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30); 64294 return __ret; 64295 } 64296 #else 64297 __ai __attribute__((target("neon"))) int8x16_t vtrn1q_s8(int8x16_t __p0, int8x16_t __p1) { 64298 int8x16_t __ret; 64299 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64300 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64301 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 2, 18, 4, 20, 6, 22, 8, 24, 10, 26, 12, 28, 14, 30); 64302 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64303 return __ret; 64304 } 64305 #endif 64306 64307 #ifdef __LITTLE_ENDIAN__ 64308 __ai __attribute__((target("neon"))) float64x2_t vtrn1q_f64(float64x2_t __p0, float64x2_t __p1) { 64309 float64x2_t __ret; 64310 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 64311 return __ret; 64312 } 64313 #else 64314 __ai __attribute__((target("neon"))) float64x2_t vtrn1q_f64(float64x2_t __p0, float64x2_t __p1) { 64315 float64x2_t __ret; 64316 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64317 float64x2_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 1, 0); 64318 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 64319 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64320 return __ret; 64321 } 64322 #endif 64323 64324 #ifdef __LITTLE_ENDIAN__ 64325 __ai __attribute__((target("neon"))) float32x4_t vtrn1q_f32(float32x4_t __p0, float32x4_t __p1) { 64326 float32x4_t __ret; 64327 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6); 64328 return __ret; 64329 } 64330 #else 64331 __ai __attribute__((target("neon"))) float32x4_t vtrn1q_f32(float32x4_t __p0, float32x4_t __p1) { 64332 float32x4_t __ret; 64333 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64334 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64335 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6); 64336 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64337 return __ret; 64338 } 64339 #endif 64340 64341 #ifdef __LITTLE_ENDIAN__ 64342 __ai __attribute__((target("neon"))) int32x4_t vtrn1q_s32(int32x4_t __p0, int32x4_t __p1) { 64343 int32x4_t __ret; 64344 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6); 64345 return __ret; 64346 } 64347 #else 64348 __ai __attribute__((target("neon"))) int32x4_t vtrn1q_s32(int32x4_t __p0, int32x4_t __p1) { 64349 int32x4_t __ret; 64350 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64351 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64352 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6); 64353 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64354 return __ret; 64355 } 64356 #endif 64357 64358 #ifdef __LITTLE_ENDIAN__ 64359 __ai __attribute__((target("neon"))) int64x2_t vtrn1q_s64(int64x2_t __p0, int64x2_t __p1) { 64360 int64x2_t __ret; 64361 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 64362 return __ret; 64363 } 64364 #else 64365 __ai __attribute__((target("neon"))) int64x2_t vtrn1q_s64(int64x2_t __p0, 
int64x2_t __p1) { 64366 int64x2_t __ret; 64367 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64368 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64369 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 64370 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64371 return __ret; 64372 } 64373 #endif 64374 64375 #ifdef __LITTLE_ENDIAN__ 64376 __ai __attribute__((target("neon"))) int16x8_t vtrn1q_s16(int16x8_t __p0, int16x8_t __p1) { 64377 int16x8_t __ret; 64378 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14); 64379 return __ret; 64380 } 64381 #else 64382 __ai __attribute__((target("neon"))) int16x8_t vtrn1q_s16(int16x8_t __p0, int16x8_t __p1) { 64383 int16x8_t __ret; 64384 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64385 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64386 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14); 64387 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64388 return __ret; 64389 } 64390 #endif 64391 64392 #ifdef __LITTLE_ENDIAN__ 64393 __ai __attribute__((target("neon"))) uint8x8_t vtrn1_u8(uint8x8_t __p0, uint8x8_t __p1) { 64394 uint8x8_t __ret; 64395 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14); 64396 return __ret; 64397 } 64398 #else 64399 __ai __attribute__((target("neon"))) uint8x8_t vtrn1_u8(uint8x8_t __p0, uint8x8_t __p1) { 64400 uint8x8_t __ret; 64401 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64402 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64403 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14); 64404 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64405 return __ret; 64406 } 64407 #endif 64408 64409 #ifdef __LITTLE_ENDIAN__ 64410 __ai __attribute__((target("neon"))) 
uint32x2_t vtrn1_u32(uint32x2_t __p0, uint32x2_t __p1) { 64411 uint32x2_t __ret; 64412 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 64413 return __ret; 64414 } 64415 #else 64416 __ai __attribute__((target("neon"))) uint32x2_t vtrn1_u32(uint32x2_t __p0, uint32x2_t __p1) { 64417 uint32x2_t __ret; 64418 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64419 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64420 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 64421 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64422 return __ret; 64423 } 64424 #endif 64425 64426 #ifdef __LITTLE_ENDIAN__ 64427 __ai __attribute__((target("neon"))) uint16x4_t vtrn1_u16(uint16x4_t __p0, uint16x4_t __p1) { 64428 uint16x4_t __ret; 64429 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6); 64430 return __ret; 64431 } 64432 #else 64433 __ai __attribute__((target("neon"))) uint16x4_t vtrn1_u16(uint16x4_t __p0, uint16x4_t __p1) { 64434 uint16x4_t __ret; 64435 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64436 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64437 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6); 64438 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64439 return __ret; 64440 } 64441 #endif 64442 64443 #ifdef __LITTLE_ENDIAN__ 64444 __ai __attribute__((target("neon"))) int8x8_t vtrn1_s8(int8x8_t __p0, int8x8_t __p1) { 64445 int8x8_t __ret; 64446 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14); 64447 return __ret; 64448 } 64449 #else 64450 __ai __attribute__((target("neon"))) int8x8_t vtrn1_s8(int8x8_t __p0, int8x8_t __p1) { 64451 int8x8_t __ret; 64452 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64453 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64454 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14); 
64455 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64456 return __ret; 64457 } 64458 #endif 64459 64460 #ifdef __LITTLE_ENDIAN__ 64461 __ai __attribute__((target("neon"))) float32x2_t vtrn1_f32(float32x2_t __p0, float32x2_t __p1) { 64462 float32x2_t __ret; 64463 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 64464 return __ret; 64465 } 64466 #else 64467 __ai __attribute__((target("neon"))) float32x2_t vtrn1_f32(float32x2_t __p0, float32x2_t __p1) { 64468 float32x2_t __ret; 64469 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64470 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64471 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 64472 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64473 return __ret; 64474 } 64475 #endif 64476 64477 #ifdef __LITTLE_ENDIAN__ 64478 __ai __attribute__((target("neon"))) int32x2_t vtrn1_s32(int32x2_t __p0, int32x2_t __p1) { 64479 int32x2_t __ret; 64480 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 64481 return __ret; 64482 } 64483 #else 64484 __ai __attribute__((target("neon"))) int32x2_t vtrn1_s32(int32x2_t __p0, int32x2_t __p1) { 64485 int32x2_t __ret; 64486 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64487 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64488 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 64489 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64490 return __ret; 64491 } 64492 #endif 64493 64494 #ifdef __LITTLE_ENDIAN__ 64495 __ai __attribute__((target("neon"))) int16x4_t vtrn1_s16(int16x4_t __p0, int16x4_t __p1) { 64496 int16x4_t __ret; 64497 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6); 64498 return __ret; 64499 } 64500 #else 64501 __ai __attribute__((target("neon"))) int16x4_t vtrn1_s16(int16x4_t __p0, int16x4_t __p1) { 64502 int16x4_t __ret; 64503 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64504 int16x4_t __rev1; 
__rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64505 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6); 64506 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64507 return __ret; 64508 } 64509 #endif 64510 64511 #ifdef __LITTLE_ENDIAN__ 64512 __ai __attribute__((target("neon"))) float16x8_t vtrn1q_f16(float16x8_t __p0, float16x8_t __p1) { 64513 float16x8_t __ret; 64514 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 2, 10, 4, 12, 6, 14); 64515 return __ret; 64516 } 64517 #else 64518 __ai __attribute__((target("neon"))) float16x8_t vtrn1q_f16(float16x8_t __p0, float16x8_t __p1) { 64519 float16x8_t __ret; 64520 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64521 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64522 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 2, 10, 4, 12, 6, 14); 64523 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64524 return __ret; 64525 } 64526 #endif 64527 64528 #ifdef __LITTLE_ENDIAN__ 64529 __ai __attribute__((target("neon"))) float16x4_t vtrn1_f16(float16x4_t __p0, float16x4_t __p1) { 64530 float16x4_t __ret; 64531 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 2, 6); 64532 return __ret; 64533 } 64534 #else 64535 __ai __attribute__((target("neon"))) float16x4_t vtrn1_f16(float16x4_t __p0, float16x4_t __p1) { 64536 float16x4_t __ret; 64537 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64538 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64539 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 2, 6); 64540 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64541 return __ret; 64542 } 64543 #endif 64544 64545 #ifdef __LITTLE_ENDIAN__ 64546 __ai __attribute__((target("neon"))) poly8x8_t vtrn2_p8(poly8x8_t __p0, poly8x8_t __p1) { 64547 poly8x8_t __ret; 64548 __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 
7, 15); 64549 return __ret; 64550 } 64551 #else 64552 __ai __attribute__((target("neon"))) poly8x8_t vtrn2_p8(poly8x8_t __p0, poly8x8_t __p1) { 64553 poly8x8_t __ret; 64554 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64555 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64556 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15); 64557 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64558 return __ret; 64559 } 64560 #endif 64561 64562 #ifdef __LITTLE_ENDIAN__ 64563 __ai __attribute__((target("neon"))) poly16x4_t vtrn2_p16(poly16x4_t __p0, poly16x4_t __p1) { 64564 poly16x4_t __ret; 64565 __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7); 64566 return __ret; 64567 } 64568 #else 64569 __ai __attribute__((target("neon"))) poly16x4_t vtrn2_p16(poly16x4_t __p0, poly16x4_t __p1) { 64570 poly16x4_t __ret; 64571 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64572 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64573 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7); 64574 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64575 return __ret; 64576 } 64577 #endif 64578 64579 #ifdef __LITTLE_ENDIAN__ 64580 __ai __attribute__((target("neon"))) poly8x16_t vtrn2q_p8(poly8x16_t __p0, poly8x16_t __p1) { 64581 poly8x16_t __ret; 64582 __ret = __builtin_shufflevector(__p0, __p1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31); 64583 return __ret; 64584 } 64585 #else 64586 __ai __attribute__((target("neon"))) poly8x16_t vtrn2q_p8(poly8x16_t __p0, poly8x16_t __p1) { 64587 poly8x16_t __ret; 64588 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64589 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64590 __ret = 
__builtin_shufflevector(__rev0, __rev1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31); 64591 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64592 return __ret; 64593 } 64594 #endif 64595 64596 #ifdef __LITTLE_ENDIAN__ 64597 __ai __attribute__((target("neon"))) poly64x2_t vtrn2q_p64(poly64x2_t __p0, poly64x2_t __p1) { 64598 poly64x2_t __ret; 64599 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 64600 return __ret; 64601 } 64602 #else 64603 __ai __attribute__((target("neon"))) poly64x2_t vtrn2q_p64(poly64x2_t __p0, poly64x2_t __p1) { 64604 poly64x2_t __ret; 64605 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64606 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64607 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 64608 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64609 return __ret; 64610 } 64611 #endif 64612 64613 #ifdef __LITTLE_ENDIAN__ 64614 __ai __attribute__((target("neon"))) poly16x8_t vtrn2q_p16(poly16x8_t __p0, poly16x8_t __p1) { 64615 poly16x8_t __ret; 64616 __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15); 64617 return __ret; 64618 } 64619 #else 64620 __ai __attribute__((target("neon"))) poly16x8_t vtrn2q_p16(poly16x8_t __p0, poly16x8_t __p1) { 64621 poly16x8_t __ret; 64622 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64623 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64624 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15); 64625 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64626 return __ret; 64627 } 64628 #endif 64629 64630 #ifdef __LITTLE_ENDIAN__ 64631 __ai __attribute__((target("neon"))) uint8x16_t vtrn2q_u8(uint8x16_t __p0, uint8x16_t __p1) { 64632 uint8x16_t __ret; 64633 __ret = __builtin_shufflevector(__p0, __p1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 
29, 15, 31); 64634 return __ret; 64635 } 64636 #else 64637 __ai __attribute__((target("neon"))) uint8x16_t vtrn2q_u8(uint8x16_t __p0, uint8x16_t __p1) { 64638 uint8x16_t __ret; 64639 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64640 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64641 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31); 64642 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64643 return __ret; 64644 } 64645 #endif 64646 64647 #ifdef __LITTLE_ENDIAN__ 64648 __ai __attribute__((target("neon"))) uint32x4_t vtrn2q_u32(uint32x4_t __p0, uint32x4_t __p1) { 64649 uint32x4_t __ret; 64650 __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7); 64651 return __ret; 64652 } 64653 #else 64654 __ai __attribute__((target("neon"))) uint32x4_t vtrn2q_u32(uint32x4_t __p0, uint32x4_t __p1) { 64655 uint32x4_t __ret; 64656 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64657 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64658 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7); 64659 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64660 return __ret; 64661 } 64662 #endif 64663 64664 #ifdef __LITTLE_ENDIAN__ 64665 __ai __attribute__((target("neon"))) uint64x2_t vtrn2q_u64(uint64x2_t __p0, uint64x2_t __p1) { 64666 uint64x2_t __ret; 64667 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 64668 return __ret; 64669 } 64670 #else 64671 __ai __attribute__((target("neon"))) uint64x2_t vtrn2q_u64(uint64x2_t __p0, uint64x2_t __p1) { 64672 uint64x2_t __ret; 64673 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64674 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64675 __ret = 
__builtin_shufflevector(__rev0, __rev1, 1, 3); 64676 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64677 return __ret; 64678 } 64679 #endif 64680 64681 #ifdef __LITTLE_ENDIAN__ 64682 __ai __attribute__((target("neon"))) uint16x8_t vtrn2q_u16(uint16x8_t __p0, uint16x8_t __p1) { 64683 uint16x8_t __ret; 64684 __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15); 64685 return __ret; 64686 } 64687 #else 64688 __ai __attribute__((target("neon"))) uint16x8_t vtrn2q_u16(uint16x8_t __p0, uint16x8_t __p1) { 64689 uint16x8_t __ret; 64690 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64691 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64692 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15); 64693 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64694 return __ret; 64695 } 64696 #endif 64697 64698 #ifdef __LITTLE_ENDIAN__ 64699 __ai __attribute__((target("neon"))) int8x16_t vtrn2q_s8(int8x16_t __p0, int8x16_t __p1) { 64700 int8x16_t __ret; 64701 __ret = __builtin_shufflevector(__p0, __p1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31); 64702 return __ret; 64703 } 64704 #else 64705 __ai __attribute__((target("neon"))) int8x16_t vtrn2q_s8(int8x16_t __p0, int8x16_t __p1) { 64706 int8x16_t __ret; 64707 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64708 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64709 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 17, 3, 19, 5, 21, 7, 23, 9, 25, 11, 27, 13, 29, 15, 31); 64710 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 64711 return __ret; 64712 } 64713 #endif 64714 64715 #ifdef __LITTLE_ENDIAN__ 64716 __ai __attribute__((target("neon"))) float64x2_t vtrn2q_f64(float64x2_t __p0, 
float64x2_t __p1) { 64717 float64x2_t __ret; 64718 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 64719 return __ret; 64720 } 64721 #else 64722 __ai __attribute__((target("neon"))) float64x2_t vtrn2q_f64(float64x2_t __p0, float64x2_t __p1) { 64723 float64x2_t __ret; 64724 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64725 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64726 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 64727 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64728 return __ret; 64729 } 64730 #endif 64731 64732 #ifdef __LITTLE_ENDIAN__ 64733 __ai __attribute__((target("neon"))) float32x4_t vtrn2q_f32(float32x4_t __p0, float32x4_t __p1) { 64734 float32x4_t __ret; 64735 __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7); 64736 return __ret; 64737 } 64738 #else 64739 __ai __attribute__((target("neon"))) float32x4_t vtrn2q_f32(float32x4_t __p0, float32x4_t __p1) { 64740 float32x4_t __ret; 64741 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64742 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64743 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7); 64744 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64745 return __ret; 64746 } 64747 #endif 64748 64749 #ifdef __LITTLE_ENDIAN__ 64750 __ai __attribute__((target("neon"))) int32x4_t vtrn2q_s32(int32x4_t __p0, int32x4_t __p1) { 64751 int32x4_t __ret; 64752 __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7); 64753 return __ret; 64754 } 64755 #else 64756 __ai __attribute__((target("neon"))) int32x4_t vtrn2q_s32(int32x4_t __p0, int32x4_t __p1) { 64757 int32x4_t __ret; 64758 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64759 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64760 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7); 64761 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 
1, 0); 64762 return __ret; 64763 } 64764 #endif 64765 64766 #ifdef __LITTLE_ENDIAN__ 64767 __ai __attribute__((target("neon"))) int64x2_t vtrn2q_s64(int64x2_t __p0, int64x2_t __p1) { 64768 int64x2_t __ret; 64769 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 64770 return __ret; 64771 } 64772 #else 64773 __ai __attribute__((target("neon"))) int64x2_t vtrn2q_s64(int64x2_t __p0, int64x2_t __p1) { 64774 int64x2_t __ret; 64775 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64776 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64777 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 64778 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64779 return __ret; 64780 } 64781 #endif 64782 64783 #ifdef __LITTLE_ENDIAN__ 64784 __ai __attribute__((target("neon"))) int16x8_t vtrn2q_s16(int16x8_t __p0, int16x8_t __p1) { 64785 int16x8_t __ret; 64786 __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15); 64787 return __ret; 64788 } 64789 #else 64790 __ai __attribute__((target("neon"))) int16x8_t vtrn2q_s16(int16x8_t __p0, int16x8_t __p1) { 64791 int16x8_t __ret; 64792 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64793 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64794 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15); 64795 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64796 return __ret; 64797 } 64798 #endif 64799 64800 #ifdef __LITTLE_ENDIAN__ 64801 __ai __attribute__((target("neon"))) uint8x8_t vtrn2_u8(uint8x8_t __p0, uint8x8_t __p1) { 64802 uint8x8_t __ret; 64803 __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15); 64804 return __ret; 64805 } 64806 #else 64807 __ai __attribute__((target("neon"))) uint8x8_t vtrn2_u8(uint8x8_t __p0, uint8x8_t __p1) { 64808 uint8x8_t __ret; 64809 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 
2, 1, 0); 64810 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64811 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15); 64812 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64813 return __ret; 64814 } 64815 #endif 64816 64817 #ifdef __LITTLE_ENDIAN__ 64818 __ai __attribute__((target("neon"))) uint32x2_t vtrn2_u32(uint32x2_t __p0, uint32x2_t __p1) { 64819 uint32x2_t __ret; 64820 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 64821 return __ret; 64822 } 64823 #else 64824 __ai __attribute__((target("neon"))) uint32x2_t vtrn2_u32(uint32x2_t __p0, uint32x2_t __p1) { 64825 uint32x2_t __ret; 64826 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64827 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64828 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 64829 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64830 return __ret; 64831 } 64832 #endif 64833 64834 #ifdef __LITTLE_ENDIAN__ 64835 __ai __attribute__((target("neon"))) uint16x4_t vtrn2_u16(uint16x4_t __p0, uint16x4_t __p1) { 64836 uint16x4_t __ret; 64837 __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7); 64838 return __ret; 64839 } 64840 #else 64841 __ai __attribute__((target("neon"))) uint16x4_t vtrn2_u16(uint16x4_t __p0, uint16x4_t __p1) { 64842 uint16x4_t __ret; 64843 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64844 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64845 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7); 64846 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64847 return __ret; 64848 } 64849 #endif 64850 64851 #ifdef __LITTLE_ENDIAN__ 64852 __ai __attribute__((target("neon"))) int8x8_t vtrn2_s8(int8x8_t __p0, int8x8_t __p1) { 64853 int8x8_t __ret; 64854 __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15); 64855 return __ret; 64856 } 64857 #else 
64858 __ai __attribute__((target("neon"))) int8x8_t vtrn2_s8(int8x8_t __p0, int8x8_t __p1) { 64859 int8x8_t __ret; 64860 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64861 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64862 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15); 64863 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64864 return __ret; 64865 } 64866 #endif 64867 64868 #ifdef __LITTLE_ENDIAN__ 64869 __ai __attribute__((target("neon"))) float32x2_t vtrn2_f32(float32x2_t __p0, float32x2_t __p1) { 64870 float32x2_t __ret; 64871 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 64872 return __ret; 64873 } 64874 #else 64875 __ai __attribute__((target("neon"))) float32x2_t vtrn2_f32(float32x2_t __p0, float32x2_t __p1) { 64876 float32x2_t __ret; 64877 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64878 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64879 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 64880 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64881 return __ret; 64882 } 64883 #endif 64884 64885 #ifdef __LITTLE_ENDIAN__ 64886 __ai __attribute__((target("neon"))) int32x2_t vtrn2_s32(int32x2_t __p0, int32x2_t __p1) { 64887 int32x2_t __ret; 64888 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 64889 return __ret; 64890 } 64891 #else 64892 __ai __attribute__((target("neon"))) int32x2_t vtrn2_s32(int32x2_t __p0, int32x2_t __p1) { 64893 int32x2_t __ret; 64894 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64895 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64896 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 64897 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64898 return __ret; 64899 } 64900 #endif 64901 64902 #ifdef __LITTLE_ENDIAN__ 64903 __ai __attribute__((target("neon"))) int16x4_t 
vtrn2_s16(int16x4_t __p0, int16x4_t __p1) { 64904 int16x4_t __ret; 64905 __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7); 64906 return __ret; 64907 } 64908 #else 64909 __ai __attribute__((target("neon"))) int16x4_t vtrn2_s16(int16x4_t __p0, int16x4_t __p1) { 64910 int16x4_t __ret; 64911 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64912 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 64913 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7); 64914 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64915 return __ret; 64916 } 64917 #endif 64918 64919 #ifdef __LITTLE_ENDIAN__ 64920 __ai __attribute__((target("neon"))) float16x8_t vtrn2q_f16(float16x8_t __p0, float16x8_t __p1) { 64921 float16x8_t __ret; 64922 __ret = __builtin_shufflevector(__p0, __p1, 1, 9, 3, 11, 5, 13, 7, 15); 64923 return __ret; 64924 } 64925 #else 64926 __ai __attribute__((target("neon"))) float16x8_t vtrn2q_f16(float16x8_t __p0, float16x8_t __p1) { 64927 float16x8_t __ret; 64928 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 64929 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 64930 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 9, 3, 11, 5, 13, 7, 15); 64931 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 64932 return __ret; 64933 } 64934 #endif 64935 64936 #ifdef __LITTLE_ENDIAN__ 64937 __ai __attribute__((target("neon"))) float16x4_t vtrn2_f16(float16x4_t __p0, float16x4_t __p1) { 64938 float16x4_t __ret; 64939 __ret = __builtin_shufflevector(__p0, __p1, 1, 5, 3, 7); 64940 return __ret; 64941 } 64942 #else 64943 __ai __attribute__((target("neon"))) float16x4_t vtrn2_f16(float16x4_t __p0, float16x4_t __p1) { 64944 float16x4_t __ret; 64945 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 64946 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 
64947 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 5, 3, 7); 64948 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 64949 return __ret; 64950 } 64951 #endif 64952 64953 __ai __attribute__((target("neon"))) uint64x1_t vtst_p64(poly64x1_t __p0, poly64x1_t __p1) { 64954 uint64x1_t __ret; 64955 __ret = (uint64x1_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 64956 return __ret; 64957 } 64958 #ifdef __LITTLE_ENDIAN__ 64959 __ai __attribute__((target("neon"))) uint64x2_t vtstq_p64(poly64x2_t __p0, poly64x2_t __p1) { 64960 uint64x2_t __ret; 64961 __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 64962 return __ret; 64963 } 64964 #else 64965 __ai __attribute__((target("neon"))) uint64x2_t vtstq_p64(poly64x2_t __p0, poly64x2_t __p1) { 64966 uint64x2_t __ret; 64967 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64968 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64969 __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 64970 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64971 return __ret; 64972 } 64973 #endif 64974 64975 #ifdef __LITTLE_ENDIAN__ 64976 __ai __attribute__((target("neon"))) uint64x2_t vtstq_u64(uint64x2_t __p0, uint64x2_t __p1) { 64977 uint64x2_t __ret; 64978 __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 64979 return __ret; 64980 } 64981 #else 64982 __ai __attribute__((target("neon"))) uint64x2_t vtstq_u64(uint64x2_t __p0, uint64x2_t __p1) { 64983 uint64x2_t __ret; 64984 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 64985 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 64986 __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 64987 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 64988 return __ret; 64989 } 64990 #endif 64991 64992 #ifdef __LITTLE_ENDIAN__ 64993 __ai 
__attribute__((target("neon"))) uint64x2_t vtstq_s64(int64x2_t __p0, int64x2_t __p1) { 64994 uint64x2_t __ret; 64995 __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__p0, (int8x16_t)__p1, 51); 64996 return __ret; 64997 } 64998 #else 64999 __ai __attribute__((target("neon"))) uint64x2_t vtstq_s64(int64x2_t __p0, int64x2_t __p1) { 65000 uint64x2_t __ret; 65001 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65002 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65003 __ret = (uint64x2_t) __builtin_neon_vtstq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 65004 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65005 return __ret; 65006 } 65007 #endif 65008 65009 __ai __attribute__((target("neon"))) uint64x1_t vtst_u64(uint64x1_t __p0, uint64x1_t __p1) { 65010 uint64x1_t __ret; 65011 __ret = (uint64x1_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 65012 return __ret; 65013 } 65014 __ai __attribute__((target("neon"))) uint64x1_t vtst_s64(int64x1_t __p0, int64x1_t __p1) { 65015 uint64x1_t __ret; 65016 __ret = (uint64x1_t) __builtin_neon_vtst_v((int8x8_t)__p0, (int8x8_t)__p1, 19); 65017 return __ret; 65018 } 65019 __ai __attribute__((target("neon"))) uint64_t vtstd_u64(uint64_t __p0, uint64_t __p1) { 65020 uint64_t __ret; 65021 __ret = (uint64_t) __builtin_neon_vtstd_u64(__p0, __p1); 65022 return __ret; 65023 } 65024 __ai __attribute__((target("neon"))) uint64_t vtstd_s64(int64_t __p0, int64_t __p1) { 65025 uint64_t __ret; 65026 __ret = (uint64_t) __builtin_neon_vtstd_s64(__p0, __p1); 65027 return __ret; 65028 } 65029 __ai __attribute__((target("neon"))) int8_t vuqaddb_s8(int8_t __p0, uint8_t __p1) { 65030 int8_t __ret; 65031 __ret = (int8_t) __builtin_neon_vuqaddb_s8(__p0, __p1); 65032 return __ret; 65033 } 65034 __ai __attribute__((target("neon"))) int32_t vuqadds_s32(int32_t __p0, uint32_t __p1) { 65035 int32_t __ret; 65036 __ret = (int32_t) __builtin_neon_vuqadds_s32(__p0, __p1); 65037 return __ret; 
65038 } 65039 __ai __attribute__((target("neon"))) int64_t vuqaddd_s64(int64_t __p0, uint64_t __p1) { 65040 int64_t __ret; 65041 __ret = (int64_t) __builtin_neon_vuqaddd_s64(__p0, __p1); 65042 return __ret; 65043 } 65044 __ai __attribute__((target("neon"))) int16_t vuqaddh_s16(int16_t __p0, uint16_t __p1) { 65045 int16_t __ret; 65046 __ret = (int16_t) __builtin_neon_vuqaddh_s16(__p0, __p1); 65047 return __ret; 65048 } 65049 #ifdef __LITTLE_ENDIAN__ 65050 __ai __attribute__((target("neon"))) int8x16_t vuqaddq_s8(int8x16_t __p0, uint8x16_t __p1) { 65051 int8x16_t __ret; 65052 __ret = (int8x16_t) __builtin_neon_vuqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 32); 65053 return __ret; 65054 } 65055 #else 65056 __ai __attribute__((target("neon"))) int8x16_t vuqaddq_s8(int8x16_t __p0, uint8x16_t __p1) { 65057 int8x16_t __ret; 65058 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65059 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65060 __ret = (int8x16_t) __builtin_neon_vuqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 32); 65061 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65062 return __ret; 65063 } 65064 #endif 65065 65066 #ifdef __LITTLE_ENDIAN__ 65067 __ai __attribute__((target("neon"))) int32x4_t vuqaddq_s32(int32x4_t __p0, uint32x4_t __p1) { 65068 int32x4_t __ret; 65069 __ret = (int32x4_t) __builtin_neon_vuqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 34); 65070 return __ret; 65071 } 65072 #else 65073 __ai __attribute__((target("neon"))) int32x4_t vuqaddq_s32(int32x4_t __p0, uint32x4_t __p1) { 65074 int32x4_t __ret; 65075 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65076 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65077 __ret = (int32x4_t) __builtin_neon_vuqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 34); 65078 
__ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65079 return __ret; 65080 } 65081 #endif 65082 65083 #ifdef __LITTLE_ENDIAN__ 65084 __ai __attribute__((target("neon"))) int64x2_t vuqaddq_s64(int64x2_t __p0, uint64x2_t __p1) { 65085 int64x2_t __ret; 65086 __ret = (int64x2_t) __builtin_neon_vuqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 35); 65087 return __ret; 65088 } 65089 #else 65090 __ai __attribute__((target("neon"))) int64x2_t vuqaddq_s64(int64x2_t __p0, uint64x2_t __p1) { 65091 int64x2_t __ret; 65092 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65093 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65094 __ret = (int64x2_t) __builtin_neon_vuqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 35); 65095 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65096 return __ret; 65097 } 65098 #endif 65099 65100 #ifdef __LITTLE_ENDIAN__ 65101 __ai __attribute__((target("neon"))) int16x8_t vuqaddq_s16(int16x8_t __p0, uint16x8_t __p1) { 65102 int16x8_t __ret; 65103 __ret = (int16x8_t) __builtin_neon_vuqaddq_v((int8x16_t)__p0, (int8x16_t)__p1, 33); 65104 return __ret; 65105 } 65106 #else 65107 __ai __attribute__((target("neon"))) int16x8_t vuqaddq_s16(int16x8_t __p0, uint16x8_t __p1) { 65108 int16x8_t __ret; 65109 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65110 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65111 __ret = (int16x8_t) __builtin_neon_vuqaddq_v((int8x16_t)__rev0, (int8x16_t)__rev1, 33); 65112 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65113 return __ret; 65114 } 65115 #endif 65116 65117 #ifdef __LITTLE_ENDIAN__ 65118 __ai __attribute__((target("neon"))) int8x8_t vuqadd_s8(int8x8_t __p0, uint8x8_t __p1) { 65119 int8x8_t __ret; 65120 __ret = (int8x8_t) __builtin_neon_vuqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 0); 65121 return __ret; 65122 } 65123 #else 65124 __ai __attribute__((target("neon"))) 
int8x8_t vuqadd_s8(int8x8_t __p0, uint8x8_t __p1) { 65125 int8x8_t __ret; 65126 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65127 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65128 __ret = (int8x8_t) __builtin_neon_vuqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 0); 65129 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65130 return __ret; 65131 } 65132 #endif 65133 65134 #ifdef __LITTLE_ENDIAN__ 65135 __ai __attribute__((target("neon"))) int32x2_t vuqadd_s32(int32x2_t __p0, uint32x2_t __p1) { 65136 int32x2_t __ret; 65137 __ret = (int32x2_t) __builtin_neon_vuqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 2); 65138 return __ret; 65139 } 65140 #else 65141 __ai __attribute__((target("neon"))) int32x2_t vuqadd_s32(int32x2_t __p0, uint32x2_t __p1) { 65142 int32x2_t __ret; 65143 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65144 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65145 __ret = (int32x2_t) __builtin_neon_vuqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 2); 65146 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65147 return __ret; 65148 } 65149 #endif 65150 65151 __ai __attribute__((target("neon"))) int64x1_t vuqadd_s64(int64x1_t __p0, uint64x1_t __p1) { 65152 int64x1_t __ret; 65153 __ret = (int64x1_t) __builtin_neon_vuqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 3); 65154 return __ret; 65155 } 65156 #ifdef __LITTLE_ENDIAN__ 65157 __ai __attribute__((target("neon"))) int16x4_t vuqadd_s16(int16x4_t __p0, uint16x4_t __p1) { 65158 int16x4_t __ret; 65159 __ret = (int16x4_t) __builtin_neon_vuqadd_v((int8x8_t)__p0, (int8x8_t)__p1, 1); 65160 return __ret; 65161 } 65162 #else 65163 __ai __attribute__((target("neon"))) int16x4_t vuqadd_s16(int16x4_t __p0, uint16x4_t __p1) { 65164 int16x4_t __ret; 65165 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65166 uint16x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65167 __ret = (int16x4_t) __builtin_neon_vuqadd_v((int8x8_t)__rev0, (int8x8_t)__rev1, 1); 65168 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65169 return __ret; 65170 } 65171 #endif 65172 65173 #ifdef __LITTLE_ENDIAN__ 65174 __ai __attribute__((target("neon"))) poly8x8_t vuzp1_p8(poly8x8_t __p0, poly8x8_t __p1) { 65175 poly8x8_t __ret; 65176 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14); 65177 return __ret; 65178 } 65179 #else 65180 __ai __attribute__((target("neon"))) poly8x8_t vuzp1_p8(poly8x8_t __p0, poly8x8_t __p1) { 65181 poly8x8_t __ret; 65182 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65183 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65184 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14); 65185 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65186 return __ret; 65187 } 65188 #endif 65189 65190 #ifdef __LITTLE_ENDIAN__ 65191 __ai __attribute__((target("neon"))) poly16x4_t vuzp1_p16(poly16x4_t __p0, poly16x4_t __p1) { 65192 poly16x4_t __ret; 65193 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6); 65194 return __ret; 65195 } 65196 #else 65197 __ai __attribute__((target("neon"))) poly16x4_t vuzp1_p16(poly16x4_t __p0, poly16x4_t __p1) { 65198 poly16x4_t __ret; 65199 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65200 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65201 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6); 65202 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65203 return __ret; 65204 } 65205 #endif 65206 65207 #ifdef __LITTLE_ENDIAN__ 65208 __ai __attribute__((target("neon"))) poly8x16_t vuzp1q_p8(poly8x16_t __p0, poly8x16_t __p1) { 65209 poly8x16_t __ret; 65210 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 
20, 22, 24, 26, 28, 30); 65211 return __ret; 65212 } 65213 #else 65214 __ai __attribute__((target("neon"))) poly8x16_t vuzp1q_p8(poly8x16_t __p0, poly8x16_t __p1) { 65215 poly8x16_t __ret; 65216 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65217 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65218 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30); 65219 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65220 return __ret; 65221 } 65222 #endif 65223 65224 #ifdef __LITTLE_ENDIAN__ 65225 __ai __attribute__((target("neon"))) poly64x2_t vuzp1q_p64(poly64x2_t __p0, poly64x2_t __p1) { 65226 poly64x2_t __ret; 65227 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 65228 return __ret; 65229 } 65230 #else 65231 __ai __attribute__((target("neon"))) poly64x2_t vuzp1q_p64(poly64x2_t __p0, poly64x2_t __p1) { 65232 poly64x2_t __ret; 65233 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65234 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65235 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 65236 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65237 return __ret; 65238 } 65239 #endif 65240 65241 #ifdef __LITTLE_ENDIAN__ 65242 __ai __attribute__((target("neon"))) poly16x8_t vuzp1q_p16(poly16x8_t __p0, poly16x8_t __p1) { 65243 poly16x8_t __ret; 65244 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14); 65245 return __ret; 65246 } 65247 #else 65248 __ai __attribute__((target("neon"))) poly16x8_t vuzp1q_p16(poly16x8_t __p0, poly16x8_t __p1) { 65249 poly16x8_t __ret; 65250 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65251 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 
65252 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14); 65253 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65254 return __ret; 65255 } 65256 #endif 65257 65258 #ifdef __LITTLE_ENDIAN__ 65259 __ai __attribute__((target("neon"))) uint8x16_t vuzp1q_u8(uint8x16_t __p0, uint8x16_t __p1) { 65260 uint8x16_t __ret; 65261 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30); 65262 return __ret; 65263 } 65264 #else 65265 __ai __attribute__((target("neon"))) uint8x16_t vuzp1q_u8(uint8x16_t __p0, uint8x16_t __p1) { 65266 uint8x16_t __ret; 65267 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65268 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65269 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30); 65270 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65271 return __ret; 65272 } 65273 #endif 65274 65275 #ifdef __LITTLE_ENDIAN__ 65276 __ai __attribute__((target("neon"))) uint32x4_t vuzp1q_u32(uint32x4_t __p0, uint32x4_t __p1) { 65277 uint32x4_t __ret; 65278 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6); 65279 return __ret; 65280 } 65281 #else 65282 __ai __attribute__((target("neon"))) uint32x4_t vuzp1q_u32(uint32x4_t __p0, uint32x4_t __p1) { 65283 uint32x4_t __ret; 65284 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65285 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65286 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6); 65287 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65288 return __ret; 65289 } 65290 #endif 65291 65292 #ifdef __LITTLE_ENDIAN__ 65293 __ai __attribute__((target("neon"))) uint64x2_t vuzp1q_u64(uint64x2_t __p0, 
uint64x2_t __p1) { 65294 uint64x2_t __ret; 65295 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 65296 return __ret; 65297 } 65298 #else 65299 __ai __attribute__((target("neon"))) uint64x2_t vuzp1q_u64(uint64x2_t __p0, uint64x2_t __p1) { 65300 uint64x2_t __ret; 65301 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65302 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65303 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 65304 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65305 return __ret; 65306 } 65307 #endif 65308 65309 #ifdef __LITTLE_ENDIAN__ 65310 __ai __attribute__((target("neon"))) uint16x8_t vuzp1q_u16(uint16x8_t __p0, uint16x8_t __p1) { 65311 uint16x8_t __ret; 65312 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14); 65313 return __ret; 65314 } 65315 #else 65316 __ai __attribute__((target("neon"))) uint16x8_t vuzp1q_u16(uint16x8_t __p0, uint16x8_t __p1) { 65317 uint16x8_t __ret; 65318 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65319 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65320 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14); 65321 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65322 return __ret; 65323 } 65324 #endif 65325 65326 #ifdef __LITTLE_ENDIAN__ 65327 __ai __attribute__((target("neon"))) int8x16_t vuzp1q_s8(int8x16_t __p0, int8x16_t __p1) { 65328 int8x16_t __ret; 65329 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30); 65330 return __ret; 65331 } 65332 #else 65333 __ai __attribute__((target("neon"))) int8x16_t vuzp1q_s8(int8x16_t __p0, int8x16_t __p1) { 65334 int8x16_t __ret; 65335 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65336 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 
14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65337 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30); 65338 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65339 return __ret; 65340 } 65341 #endif 65342 65343 #ifdef __LITTLE_ENDIAN__ 65344 __ai __attribute__((target("neon"))) float64x2_t vuzp1q_f64(float64x2_t __p0, float64x2_t __p1) { 65345 float64x2_t __ret; 65346 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 65347 return __ret; 65348 } 65349 #else 65350 __ai __attribute__((target("neon"))) float64x2_t vuzp1q_f64(float64x2_t __p0, float64x2_t __p1) { 65351 float64x2_t __ret; 65352 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65353 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65354 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 65355 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65356 return __ret; 65357 } 65358 #endif 65359 65360 #ifdef __LITTLE_ENDIAN__ 65361 __ai __attribute__((target("neon"))) float32x4_t vuzp1q_f32(float32x4_t __p0, float32x4_t __p1) { 65362 float32x4_t __ret; 65363 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6); 65364 return __ret; 65365 } 65366 #else 65367 __ai __attribute__((target("neon"))) float32x4_t vuzp1q_f32(float32x4_t __p0, float32x4_t __p1) { 65368 float32x4_t __ret; 65369 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65370 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65371 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6); 65372 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65373 return __ret; 65374 } 65375 #endif 65376 65377 #ifdef __LITTLE_ENDIAN__ 65378 __ai __attribute__((target("neon"))) int32x4_t vuzp1q_s32(int32x4_t __p0, int32x4_t __p1) { 65379 int32x4_t __ret; 65380 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6); 65381 return 
__ret; 65382 } 65383 #else 65384 __ai __attribute__((target("neon"))) int32x4_t vuzp1q_s32(int32x4_t __p0, int32x4_t __p1) { 65385 int32x4_t __ret; 65386 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65387 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65388 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6); 65389 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65390 return __ret; 65391 } 65392 #endif 65393 65394 #ifdef __LITTLE_ENDIAN__ 65395 __ai __attribute__((target("neon"))) int64x2_t vuzp1q_s64(int64x2_t __p0, int64x2_t __p1) { 65396 int64x2_t __ret; 65397 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 65398 return __ret; 65399 } 65400 #else 65401 __ai __attribute__((target("neon"))) int64x2_t vuzp1q_s64(int64x2_t __p0, int64x2_t __p1) { 65402 int64x2_t __ret; 65403 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65404 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65405 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 65406 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65407 return __ret; 65408 } 65409 #endif 65410 65411 #ifdef __LITTLE_ENDIAN__ 65412 __ai __attribute__((target("neon"))) int16x8_t vuzp1q_s16(int16x8_t __p0, int16x8_t __p1) { 65413 int16x8_t __ret; 65414 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14); 65415 return __ret; 65416 } 65417 #else 65418 __ai __attribute__((target("neon"))) int16x8_t vuzp1q_s16(int16x8_t __p0, int16x8_t __p1) { 65419 int16x8_t __ret; 65420 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65421 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65422 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14); 65423 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65424 return __ret; 65425 } 65426 #endif 65427 65428 #ifdef __LITTLE_ENDIAN__ 
65429 __ai __attribute__((target("neon"))) uint8x8_t vuzp1_u8(uint8x8_t __p0, uint8x8_t __p1) { 65430 uint8x8_t __ret; 65431 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14); 65432 return __ret; 65433 } 65434 #else 65435 __ai __attribute__((target("neon"))) uint8x8_t vuzp1_u8(uint8x8_t __p0, uint8x8_t __p1) { 65436 uint8x8_t __ret; 65437 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65438 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65439 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14); 65440 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65441 return __ret; 65442 } 65443 #endif 65444 65445 #ifdef __LITTLE_ENDIAN__ 65446 __ai __attribute__((target("neon"))) uint32x2_t vuzp1_u32(uint32x2_t __p0, uint32x2_t __p1) { 65447 uint32x2_t __ret; 65448 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 65449 return __ret; 65450 } 65451 #else 65452 __ai __attribute__((target("neon"))) uint32x2_t vuzp1_u32(uint32x2_t __p0, uint32x2_t __p1) { 65453 uint32x2_t __ret; 65454 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65455 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65456 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 65457 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65458 return __ret; 65459 } 65460 #endif 65461 65462 #ifdef __LITTLE_ENDIAN__ 65463 __ai __attribute__((target("neon"))) uint16x4_t vuzp1_u16(uint16x4_t __p0, uint16x4_t __p1) { 65464 uint16x4_t __ret; 65465 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6); 65466 return __ret; 65467 } 65468 #else 65469 __ai __attribute__((target("neon"))) uint16x4_t vuzp1_u16(uint16x4_t __p0, uint16x4_t __p1) { 65470 uint16x4_t __ret; 65471 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65472 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 
65473 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6); 65474 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65475 return __ret; 65476 } 65477 #endif 65478 65479 #ifdef __LITTLE_ENDIAN__ 65480 __ai __attribute__((target("neon"))) int8x8_t vuzp1_s8(int8x8_t __p0, int8x8_t __p1) { 65481 int8x8_t __ret; 65482 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14); 65483 return __ret; 65484 } 65485 #else 65486 __ai __attribute__((target("neon"))) int8x8_t vuzp1_s8(int8x8_t __p0, int8x8_t __p1) { 65487 int8x8_t __ret; 65488 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65489 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65490 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14); 65491 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65492 return __ret; 65493 } 65494 #endif 65495 65496 #ifdef __LITTLE_ENDIAN__ 65497 __ai __attribute__((target("neon"))) float32x2_t vuzp1_f32(float32x2_t __p0, float32x2_t __p1) { 65498 float32x2_t __ret; 65499 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 65500 return __ret; 65501 } 65502 #else 65503 __ai __attribute__((target("neon"))) float32x2_t vuzp1_f32(float32x2_t __p0, float32x2_t __p1) { 65504 float32x2_t __ret; 65505 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65506 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65507 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 65508 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65509 return __ret; 65510 } 65511 #endif 65512 65513 #ifdef __LITTLE_ENDIAN__ 65514 __ai __attribute__((target("neon"))) int32x2_t vuzp1_s32(int32x2_t __p0, int32x2_t __p1) { 65515 int32x2_t __ret; 65516 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 65517 return __ret; 65518 } 65519 #else 65520 __ai __attribute__((target("neon"))) int32x2_t vuzp1_s32(int32x2_t __p0, int32x2_t __p1) 
{ 65521 int32x2_t __ret; 65522 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65523 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65524 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 65525 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65526 return __ret; 65527 } 65528 #endif 65529 65530 #ifdef __LITTLE_ENDIAN__ 65531 __ai __attribute__((target("neon"))) int16x4_t vuzp1_s16(int16x4_t __p0, int16x4_t __p1) { 65532 int16x4_t __ret; 65533 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6); 65534 return __ret; 65535 } 65536 #else 65537 __ai __attribute__((target("neon"))) int16x4_t vuzp1_s16(int16x4_t __p0, int16x4_t __p1) { 65538 int16x4_t __ret; 65539 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65540 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65541 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6); 65542 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65543 return __ret; 65544 } 65545 #endif 65546 65547 #ifdef __LITTLE_ENDIAN__ 65548 __ai __attribute__((target("neon"))) float16x8_t vuzp1q_f16(float16x8_t __p0, float16x8_t __p1) { 65549 float16x8_t __ret; 65550 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6, 8, 10, 12, 14); 65551 return __ret; 65552 } 65553 #else 65554 __ai __attribute__((target("neon"))) float16x8_t vuzp1q_f16(float16x8_t __p0, float16x8_t __p1) { 65555 float16x8_t __ret; 65556 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65557 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65558 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6, 8, 10, 12, 14); 65559 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65560 return __ret; 65561 } 65562 #endif 65563 65564 #ifdef __LITTLE_ENDIAN__ 65565 __ai __attribute__((target("neon"))) float16x4_t vuzp1_f16(float16x4_t __p0, float16x4_t __p1) { 
65566 float16x4_t __ret; 65567 __ret = __builtin_shufflevector(__p0, __p1, 0, 2, 4, 6); 65568 return __ret; 65569 } 65570 #else 65571 __ai __attribute__((target("neon"))) float16x4_t vuzp1_f16(float16x4_t __p0, float16x4_t __p1) { 65572 float16x4_t __ret; 65573 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65574 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65575 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2, 4, 6); 65576 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65577 return __ret; 65578 } 65579 #endif 65580 65581 #ifdef __LITTLE_ENDIAN__ 65582 __ai __attribute__((target("neon"))) poly8x8_t vuzp2_p8(poly8x8_t __p0, poly8x8_t __p1) { 65583 poly8x8_t __ret; 65584 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15); 65585 return __ret; 65586 } 65587 #else 65588 __ai __attribute__((target("neon"))) poly8x8_t vuzp2_p8(poly8x8_t __p0, poly8x8_t __p1) { 65589 poly8x8_t __ret; 65590 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65591 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65592 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15); 65593 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65594 return __ret; 65595 } 65596 #endif 65597 65598 #ifdef __LITTLE_ENDIAN__ 65599 __ai __attribute__((target("neon"))) poly16x4_t vuzp2_p16(poly16x4_t __p0, poly16x4_t __p1) { 65600 poly16x4_t __ret; 65601 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7); 65602 return __ret; 65603 } 65604 #else 65605 __ai __attribute__((target("neon"))) poly16x4_t vuzp2_p16(poly16x4_t __p0, poly16x4_t __p1) { 65606 poly16x4_t __ret; 65607 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65608 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65609 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7); 
65610 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65611 return __ret; 65612 } 65613 #endif 65614 65615 #ifdef __LITTLE_ENDIAN__ 65616 __ai __attribute__((target("neon"))) poly8x16_t vuzp2q_p8(poly8x16_t __p0, poly8x16_t __p1) { 65617 poly8x16_t __ret; 65618 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31); 65619 return __ret; 65620 } 65621 #else 65622 __ai __attribute__((target("neon"))) poly8x16_t vuzp2q_p8(poly8x16_t __p0, poly8x16_t __p1) { 65623 poly8x16_t __ret; 65624 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65625 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65626 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31); 65627 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65628 return __ret; 65629 } 65630 #endif 65631 65632 #ifdef __LITTLE_ENDIAN__ 65633 __ai __attribute__((target("neon"))) poly64x2_t vuzp2q_p64(poly64x2_t __p0, poly64x2_t __p1) { 65634 poly64x2_t __ret; 65635 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 65636 return __ret; 65637 } 65638 #else 65639 __ai __attribute__((target("neon"))) poly64x2_t vuzp2q_p64(poly64x2_t __p0, poly64x2_t __p1) { 65640 poly64x2_t __ret; 65641 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65642 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65643 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 65644 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65645 return __ret; 65646 } 65647 #endif 65648 65649 #ifdef __LITTLE_ENDIAN__ 65650 __ai __attribute__((target("neon"))) poly16x8_t vuzp2q_p16(poly16x8_t __p0, poly16x8_t __p1) { 65651 poly16x8_t __ret; 65652 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15); 65653 
return __ret; 65654 } 65655 #else 65656 __ai __attribute__((target("neon"))) poly16x8_t vuzp2q_p16(poly16x8_t __p0, poly16x8_t __p1) { 65657 poly16x8_t __ret; 65658 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65659 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65660 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15); 65661 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65662 return __ret; 65663 } 65664 #endif 65665 65666 #ifdef __LITTLE_ENDIAN__ 65667 __ai __attribute__((target("neon"))) uint8x16_t vuzp2q_u8(uint8x16_t __p0, uint8x16_t __p1) { 65668 uint8x16_t __ret; 65669 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31); 65670 return __ret; 65671 } 65672 #else 65673 __ai __attribute__((target("neon"))) uint8x16_t vuzp2q_u8(uint8x16_t __p0, uint8x16_t __p1) { 65674 uint8x16_t __ret; 65675 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65676 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65677 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31); 65678 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65679 return __ret; 65680 } 65681 #endif 65682 65683 #ifdef __LITTLE_ENDIAN__ 65684 __ai __attribute__((target("neon"))) uint32x4_t vuzp2q_u32(uint32x4_t __p0, uint32x4_t __p1) { 65685 uint32x4_t __ret; 65686 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7); 65687 return __ret; 65688 } 65689 #else 65690 __ai __attribute__((target("neon"))) uint32x4_t vuzp2q_u32(uint32x4_t __p0, uint32x4_t __p1) { 65691 uint32x4_t __ret; 65692 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65693 uint32x4_t __rev1; 
__rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65694 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7); 65695 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65696 return __ret; 65697 } 65698 #endif 65699 65700 #ifdef __LITTLE_ENDIAN__ 65701 __ai __attribute__((target("neon"))) uint64x2_t vuzp2q_u64(uint64x2_t __p0, uint64x2_t __p1) { 65702 uint64x2_t __ret; 65703 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 65704 return __ret; 65705 } 65706 #else 65707 __ai __attribute__((target("neon"))) uint64x2_t vuzp2q_u64(uint64x2_t __p0, uint64x2_t __p1) { 65708 uint64x2_t __ret; 65709 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65710 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65711 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 65712 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65713 return __ret; 65714 } 65715 #endif 65716 65717 #ifdef __LITTLE_ENDIAN__ 65718 __ai __attribute__((target("neon"))) uint16x8_t vuzp2q_u16(uint16x8_t __p0, uint16x8_t __p1) { 65719 uint16x8_t __ret; 65720 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15); 65721 return __ret; 65722 } 65723 #else 65724 __ai __attribute__((target("neon"))) uint16x8_t vuzp2q_u16(uint16x8_t __p0, uint16x8_t __p1) { 65725 uint16x8_t __ret; 65726 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65727 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65728 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15); 65729 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65730 return __ret; 65731 } 65732 #endif 65733 65734 #ifdef __LITTLE_ENDIAN__ 65735 __ai __attribute__((target("neon"))) int8x16_t vuzp2q_s8(int8x16_t __p0, int8x16_t __p1) { 65736 int8x16_t __ret; 65737 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31); 65738 
return __ret; 65739 } 65740 #else 65741 __ai __attribute__((target("neon"))) int8x16_t vuzp2q_s8(int8x16_t __p0, int8x16_t __p1) { 65742 int8x16_t __ret; 65743 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65744 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65745 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15, 17, 19, 21, 23, 25, 27, 29, 31); 65746 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 65747 return __ret; 65748 } 65749 #endif 65750 65751 #ifdef __LITTLE_ENDIAN__ 65752 __ai __attribute__((target("neon"))) float64x2_t vuzp2q_f64(float64x2_t __p0, float64x2_t __p1) { 65753 float64x2_t __ret; 65754 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 65755 return __ret; 65756 } 65757 #else 65758 __ai __attribute__((target("neon"))) float64x2_t vuzp2q_f64(float64x2_t __p0, float64x2_t __p1) { 65759 float64x2_t __ret; 65760 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65761 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65762 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 65763 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65764 return __ret; 65765 } 65766 #endif 65767 65768 #ifdef __LITTLE_ENDIAN__ 65769 __ai __attribute__((target("neon"))) float32x4_t vuzp2q_f32(float32x4_t __p0, float32x4_t __p1) { 65770 float32x4_t __ret; 65771 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7); 65772 return __ret; 65773 } 65774 #else 65775 __ai __attribute__((target("neon"))) float32x4_t vuzp2q_f32(float32x4_t __p0, float32x4_t __p1) { 65776 float32x4_t __ret; 65777 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65778 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65779 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 
5, 7); 65780 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65781 return __ret; 65782 } 65783 #endif 65784 65785 #ifdef __LITTLE_ENDIAN__ 65786 __ai __attribute__((target("neon"))) int32x4_t vuzp2q_s32(int32x4_t __p0, int32x4_t __p1) { 65787 int32x4_t __ret; 65788 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7); 65789 return __ret; 65790 } 65791 #else 65792 __ai __attribute__((target("neon"))) int32x4_t vuzp2q_s32(int32x4_t __p0, int32x4_t __p1) { 65793 int32x4_t __ret; 65794 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65795 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65796 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7); 65797 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65798 return __ret; 65799 } 65800 #endif 65801 65802 #ifdef __LITTLE_ENDIAN__ 65803 __ai __attribute__((target("neon"))) int64x2_t vuzp2q_s64(int64x2_t __p0, int64x2_t __p1) { 65804 int64x2_t __ret; 65805 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 65806 return __ret; 65807 } 65808 #else 65809 __ai __attribute__((target("neon"))) int64x2_t vuzp2q_s64(int64x2_t __p0, int64x2_t __p1) { 65810 int64x2_t __ret; 65811 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65812 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65813 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 65814 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65815 return __ret; 65816 } 65817 #endif 65818 65819 #ifdef __LITTLE_ENDIAN__ 65820 __ai __attribute__((target("neon"))) int16x8_t vuzp2q_s16(int16x8_t __p0, int16x8_t __p1) { 65821 int16x8_t __ret; 65822 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15); 65823 return __ret; 65824 } 65825 #else 65826 __ai __attribute__((target("neon"))) int16x8_t vuzp2q_s16(int16x8_t __p0, int16x8_t __p1) { 65827 int16x8_t __ret; 65828 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 
3, 2, 1, 0); 65829 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65830 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15); 65831 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65832 return __ret; 65833 } 65834 #endif 65835 65836 #ifdef __LITTLE_ENDIAN__ 65837 __ai __attribute__((target("neon"))) uint8x8_t vuzp2_u8(uint8x8_t __p0, uint8x8_t __p1) { 65838 uint8x8_t __ret; 65839 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15); 65840 return __ret; 65841 } 65842 #else 65843 __ai __attribute__((target("neon"))) uint8x8_t vuzp2_u8(uint8x8_t __p0, uint8x8_t __p1) { 65844 uint8x8_t __ret; 65845 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65846 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65847 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15); 65848 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65849 return __ret; 65850 } 65851 #endif 65852 65853 #ifdef __LITTLE_ENDIAN__ 65854 __ai __attribute__((target("neon"))) uint32x2_t vuzp2_u32(uint32x2_t __p0, uint32x2_t __p1) { 65855 uint32x2_t __ret; 65856 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 65857 return __ret; 65858 } 65859 #else 65860 __ai __attribute__((target("neon"))) uint32x2_t vuzp2_u32(uint32x2_t __p0, uint32x2_t __p1) { 65861 uint32x2_t __ret; 65862 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65863 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65864 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 65865 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65866 return __ret; 65867 } 65868 #endif 65869 65870 #ifdef __LITTLE_ENDIAN__ 65871 __ai __attribute__((target("neon"))) uint16x4_t vuzp2_u16(uint16x4_t __p0, uint16x4_t __p1) { 65872 uint16x4_t __ret; 65873 __ret = __builtin_shufflevector(__p0, __p1, 1, 
3, 5, 7); 65874 return __ret; 65875 } 65876 #else 65877 __ai __attribute__((target("neon"))) uint16x4_t vuzp2_u16(uint16x4_t __p0, uint16x4_t __p1) { 65878 uint16x4_t __ret; 65879 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65880 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65881 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7); 65882 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65883 return __ret; 65884 } 65885 #endif 65886 65887 #ifdef __LITTLE_ENDIAN__ 65888 __ai __attribute__((target("neon"))) int8x8_t vuzp2_s8(int8x8_t __p0, int8x8_t __p1) { 65889 int8x8_t __ret; 65890 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15); 65891 return __ret; 65892 } 65893 #else 65894 __ai __attribute__((target("neon"))) int8x8_t vuzp2_s8(int8x8_t __p0, int8x8_t __p1) { 65895 int8x8_t __ret; 65896 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65897 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 65898 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15); 65899 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65900 return __ret; 65901 } 65902 #endif 65903 65904 #ifdef __LITTLE_ENDIAN__ 65905 __ai __attribute__((target("neon"))) float32x2_t vuzp2_f32(float32x2_t __p0, float32x2_t __p1) { 65906 float32x2_t __ret; 65907 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 65908 return __ret; 65909 } 65910 #else 65911 __ai __attribute__((target("neon"))) float32x2_t vuzp2_f32(float32x2_t __p0, float32x2_t __p1) { 65912 float32x2_t __ret; 65913 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65914 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65915 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 65916 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65917 return __ret; 65918 } 65919 #endif 65920 
65921 #ifdef __LITTLE_ENDIAN__ 65922 __ai __attribute__((target("neon"))) int32x2_t vuzp2_s32(int32x2_t __p0, int32x2_t __p1) { 65923 int32x2_t __ret; 65924 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 65925 return __ret; 65926 } 65927 #else 65928 __ai __attribute__((target("neon"))) int32x2_t vuzp2_s32(int32x2_t __p0, int32x2_t __p1) { 65929 int32x2_t __ret; 65930 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 65931 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 65932 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 65933 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 65934 return __ret; 65935 } 65936 #endif 65937 65938 #ifdef __LITTLE_ENDIAN__ 65939 __ai __attribute__((target("neon"))) int16x4_t vuzp2_s16(int16x4_t __p0, int16x4_t __p1) { 65940 int16x4_t __ret; 65941 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7); 65942 return __ret; 65943 } 65944 #else 65945 __ai __attribute__((target("neon"))) int16x4_t vuzp2_s16(int16x4_t __p0, int16x4_t __p1) { 65946 int16x4_t __ret; 65947 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65948 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65949 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7); 65950 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65951 return __ret; 65952 } 65953 #endif 65954 65955 #ifdef __LITTLE_ENDIAN__ 65956 __ai __attribute__((target("neon"))) float16x8_t vuzp2q_f16(float16x8_t __p0, float16x8_t __p1) { 65957 float16x8_t __ret; 65958 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7, 9, 11, 13, 15); 65959 return __ret; 65960 } 65961 #else 65962 __ai __attribute__((target("neon"))) float16x8_t vuzp2q_f16(float16x8_t __p0, float16x8_t __p1) { 65963 float16x8_t __ret; 65964 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65965 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 
0); 65966 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7, 9, 11, 13, 15); 65967 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 65968 return __ret; 65969 } 65970 #endif 65971 65972 #ifdef __LITTLE_ENDIAN__ 65973 __ai __attribute__((target("neon"))) float16x4_t vuzp2_f16(float16x4_t __p0, float16x4_t __p1) { 65974 float16x4_t __ret; 65975 __ret = __builtin_shufflevector(__p0, __p1, 1, 3, 5, 7); 65976 return __ret; 65977 } 65978 #else 65979 __ai __attribute__((target("neon"))) float16x4_t vuzp2_f16(float16x4_t __p0, float16x4_t __p1) { 65980 float16x4_t __ret; 65981 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 65982 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 65983 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3, 5, 7); 65984 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 65985 return __ret; 65986 } 65987 #endif 65988 65989 #ifdef __LITTLE_ENDIAN__ 65990 __ai __attribute__((target("neon"))) poly8x8_t vzip1_p8(poly8x8_t __p0, poly8x8_t __p1) { 65991 poly8x8_t __ret; 65992 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11); 65993 return __ret; 65994 } 65995 #else 65996 __ai __attribute__((target("neon"))) poly8x8_t vzip1_p8(poly8x8_t __p0, poly8x8_t __p1) { 65997 poly8x8_t __ret; 65998 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 65999 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66000 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11); 66001 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66002 return __ret; 66003 } 66004 #endif 66005 66006 #ifdef __LITTLE_ENDIAN__ 66007 __ai __attribute__((target("neon"))) poly16x4_t vzip1_p16(poly16x4_t __p0, poly16x4_t __p1) { 66008 poly16x4_t __ret; 66009 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5); 66010 return __ret; 66011 } 66012 #else 66013 __ai 
__attribute__((target("neon"))) poly16x4_t vzip1_p16(poly16x4_t __p0, poly16x4_t __p1) { 66014 poly16x4_t __ret; 66015 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66016 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66017 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5); 66018 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66019 return __ret; 66020 } 66021 #endif 66022 66023 #ifdef __LITTLE_ENDIAN__ 66024 __ai __attribute__((target("neon"))) poly8x16_t vzip1q_p8(poly8x16_t __p0, poly8x16_t __p1) { 66025 poly8x16_t __ret; 66026 __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23); 66027 return __ret; 66028 } 66029 #else 66030 __ai __attribute__((target("neon"))) poly8x16_t vzip1q_p8(poly8x16_t __p0, poly8x16_t __p1) { 66031 poly8x16_t __ret; 66032 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66033 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66034 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23); 66035 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66036 return __ret; 66037 } 66038 #endif 66039 66040 #ifdef __LITTLE_ENDIAN__ 66041 __ai __attribute__((target("neon"))) poly64x2_t vzip1q_p64(poly64x2_t __p0, poly64x2_t __p1) { 66042 poly64x2_t __ret; 66043 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 66044 return __ret; 66045 } 66046 #else 66047 __ai __attribute__((target("neon"))) poly64x2_t vzip1q_p64(poly64x2_t __p0, poly64x2_t __p1) { 66048 poly64x2_t __ret; 66049 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66050 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66051 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 66052 
__ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66053 return __ret; 66054 } 66055 #endif 66056 66057 #ifdef __LITTLE_ENDIAN__ 66058 __ai __attribute__((target("neon"))) poly16x8_t vzip1q_p16(poly16x8_t __p0, poly16x8_t __p1) { 66059 poly16x8_t __ret; 66060 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11); 66061 return __ret; 66062 } 66063 #else 66064 __ai __attribute__((target("neon"))) poly16x8_t vzip1q_p16(poly16x8_t __p0, poly16x8_t __p1) { 66065 poly16x8_t __ret; 66066 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66067 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66068 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11); 66069 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66070 return __ret; 66071 } 66072 #endif 66073 66074 #ifdef __LITTLE_ENDIAN__ 66075 __ai __attribute__((target("neon"))) uint8x16_t vzip1q_u8(uint8x16_t __p0, uint8x16_t __p1) { 66076 uint8x16_t __ret; 66077 __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23); 66078 return __ret; 66079 } 66080 #else 66081 __ai __attribute__((target("neon"))) uint8x16_t vzip1q_u8(uint8x16_t __p0, uint8x16_t __p1) { 66082 uint8x16_t __ret; 66083 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66084 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66085 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23); 66086 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66087 return __ret; 66088 } 66089 #endif 66090 66091 #ifdef __LITTLE_ENDIAN__ 66092 __ai __attribute__((target("neon"))) uint32x4_t vzip1q_u32(uint32x4_t __p0, uint32x4_t __p1) { 66093 uint32x4_t __ret; 66094 
__ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5); 66095 return __ret; 66096 } 66097 #else 66098 __ai __attribute__((target("neon"))) uint32x4_t vzip1q_u32(uint32x4_t __p0, uint32x4_t __p1) { 66099 uint32x4_t __ret; 66100 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66101 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66102 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5); 66103 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66104 return __ret; 66105 } 66106 #endif 66107 66108 #ifdef __LITTLE_ENDIAN__ 66109 __ai __attribute__((target("neon"))) uint64x2_t vzip1q_u64(uint64x2_t __p0, uint64x2_t __p1) { 66110 uint64x2_t __ret; 66111 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 66112 return __ret; 66113 } 66114 #else 66115 __ai __attribute__((target("neon"))) uint64x2_t vzip1q_u64(uint64x2_t __p0, uint64x2_t __p1) { 66116 uint64x2_t __ret; 66117 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66118 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66119 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 66120 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66121 return __ret; 66122 } 66123 #endif 66124 66125 #ifdef __LITTLE_ENDIAN__ 66126 __ai __attribute__((target("neon"))) uint16x8_t vzip1q_u16(uint16x8_t __p0, uint16x8_t __p1) { 66127 uint16x8_t __ret; 66128 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11); 66129 return __ret; 66130 } 66131 #else 66132 __ai __attribute__((target("neon"))) uint16x8_t vzip1q_u16(uint16x8_t __p0, uint16x8_t __p1) { 66133 uint16x8_t __ret; 66134 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66135 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66136 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11); 66137 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 
3, 2, 1, 0); 66138 return __ret; 66139 } 66140 #endif 66141 66142 #ifdef __LITTLE_ENDIAN__ 66143 __ai __attribute__((target("neon"))) int8x16_t vzip1q_s8(int8x16_t __p0, int8x16_t __p1) { 66144 int8x16_t __ret; 66145 __ret = __builtin_shufflevector(__p0, __p1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23); 66146 return __ret; 66147 } 66148 #else 66149 __ai __attribute__((target("neon"))) int8x16_t vzip1q_s8(int8x16_t __p0, int8x16_t __p1) { 66150 int8x16_t __ret; 66151 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66152 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66153 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 16, 1, 17, 2, 18, 3, 19, 4, 20, 5, 21, 6, 22, 7, 23); 66154 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66155 return __ret; 66156 } 66157 #endif 66158 66159 #ifdef __LITTLE_ENDIAN__ 66160 __ai __attribute__((target("neon"))) float64x2_t vzip1q_f64(float64x2_t __p0, float64x2_t __p1) { 66161 float64x2_t __ret; 66162 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 66163 return __ret; 66164 } 66165 #else 66166 __ai __attribute__((target("neon"))) float64x2_t vzip1q_f64(float64x2_t __p0, float64x2_t __p1) { 66167 float64x2_t __ret; 66168 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66169 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66170 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 66171 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66172 return __ret; 66173 } 66174 #endif 66175 66176 #ifdef __LITTLE_ENDIAN__ 66177 __ai __attribute__((target("neon"))) float32x4_t vzip1q_f32(float32x4_t __p0, float32x4_t __p1) { 66178 float32x4_t __ret; 66179 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5); 66180 return __ret; 66181 } 66182 #else 66183 __ai 
__attribute__((target("neon"))) float32x4_t vzip1q_f32(float32x4_t __p0, float32x4_t __p1) { 66184 float32x4_t __ret; 66185 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66186 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66187 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5); 66188 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66189 return __ret; 66190 } 66191 #endif 66192 66193 #ifdef __LITTLE_ENDIAN__ 66194 __ai __attribute__((target("neon"))) int32x4_t vzip1q_s32(int32x4_t __p0, int32x4_t __p1) { 66195 int32x4_t __ret; 66196 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5); 66197 return __ret; 66198 } 66199 #else 66200 __ai __attribute__((target("neon"))) int32x4_t vzip1q_s32(int32x4_t __p0, int32x4_t __p1) { 66201 int32x4_t __ret; 66202 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66203 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66204 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5); 66205 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66206 return __ret; 66207 } 66208 #endif 66209 66210 #ifdef __LITTLE_ENDIAN__ 66211 __ai __attribute__((target("neon"))) int64x2_t vzip1q_s64(int64x2_t __p0, int64x2_t __p1) { 66212 int64x2_t __ret; 66213 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 66214 return __ret; 66215 } 66216 #else 66217 __ai __attribute__((target("neon"))) int64x2_t vzip1q_s64(int64x2_t __p0, int64x2_t __p1) { 66218 int64x2_t __ret; 66219 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66220 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66221 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 66222 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66223 return __ret; 66224 } 66225 #endif 66226 66227 #ifdef __LITTLE_ENDIAN__ 66228 __ai __attribute__((target("neon"))) int16x8_t vzip1q_s16(int16x8_t __p0, int16x8_t __p1) 
{ 66229 int16x8_t __ret; 66230 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11); 66231 return __ret; 66232 } 66233 #else 66234 __ai __attribute__((target("neon"))) int16x8_t vzip1q_s16(int16x8_t __p0, int16x8_t __p1) { 66235 int16x8_t __ret; 66236 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66237 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66238 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11); 66239 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66240 return __ret; 66241 } 66242 #endif 66243 66244 #ifdef __LITTLE_ENDIAN__ 66245 __ai __attribute__((target("neon"))) uint8x8_t vzip1_u8(uint8x8_t __p0, uint8x8_t __p1) { 66246 uint8x8_t __ret; 66247 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11); 66248 return __ret; 66249 } 66250 #else 66251 __ai __attribute__((target("neon"))) uint8x8_t vzip1_u8(uint8x8_t __p0, uint8x8_t __p1) { 66252 uint8x8_t __ret; 66253 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66254 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66255 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11); 66256 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66257 return __ret; 66258 } 66259 #endif 66260 66261 #ifdef __LITTLE_ENDIAN__ 66262 __ai __attribute__((target("neon"))) uint32x2_t vzip1_u32(uint32x2_t __p0, uint32x2_t __p1) { 66263 uint32x2_t __ret; 66264 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 66265 return __ret; 66266 } 66267 #else 66268 __ai __attribute__((target("neon"))) uint32x2_t vzip1_u32(uint32x2_t __p0, uint32x2_t __p1) { 66269 uint32x2_t __ret; 66270 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66271 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66272 __ret = 
__builtin_shufflevector(__rev0, __rev1, 0, 2); 66273 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66274 return __ret; 66275 } 66276 #endif 66277 66278 #ifdef __LITTLE_ENDIAN__ 66279 __ai __attribute__((target("neon"))) uint16x4_t vzip1_u16(uint16x4_t __p0, uint16x4_t __p1) { 66280 uint16x4_t __ret; 66281 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5); 66282 return __ret; 66283 } 66284 #else 66285 __ai __attribute__((target("neon"))) uint16x4_t vzip1_u16(uint16x4_t __p0, uint16x4_t __p1) { 66286 uint16x4_t __ret; 66287 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66288 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66289 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5); 66290 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66291 return __ret; 66292 } 66293 #endif 66294 66295 #ifdef __LITTLE_ENDIAN__ 66296 __ai __attribute__((target("neon"))) int8x8_t vzip1_s8(int8x8_t __p0, int8x8_t __p1) { 66297 int8x8_t __ret; 66298 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11); 66299 return __ret; 66300 } 66301 #else 66302 __ai __attribute__((target("neon"))) int8x8_t vzip1_s8(int8x8_t __p0, int8x8_t __p1) { 66303 int8x8_t __ret; 66304 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66305 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66306 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11); 66307 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66308 return __ret; 66309 } 66310 #endif 66311 66312 #ifdef __LITTLE_ENDIAN__ 66313 __ai __attribute__((target("neon"))) float32x2_t vzip1_f32(float32x2_t __p0, float32x2_t __p1) { 66314 float32x2_t __ret; 66315 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 66316 return __ret; 66317 } 66318 #else 66319 __ai __attribute__((target("neon"))) float32x2_t vzip1_f32(float32x2_t __p0, float32x2_t 
__p1) { 66320 float32x2_t __ret; 66321 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66322 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66323 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 66324 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66325 return __ret; 66326 } 66327 #endif 66328 66329 #ifdef __LITTLE_ENDIAN__ 66330 __ai __attribute__((target("neon"))) int32x2_t vzip1_s32(int32x2_t __p0, int32x2_t __p1) { 66331 int32x2_t __ret; 66332 __ret = __builtin_shufflevector(__p0, __p1, 0, 2); 66333 return __ret; 66334 } 66335 #else 66336 __ai __attribute__((target("neon"))) int32x2_t vzip1_s32(int32x2_t __p0, int32x2_t __p1) { 66337 int32x2_t __ret; 66338 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66339 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66340 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 2); 66341 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66342 return __ret; 66343 } 66344 #endif 66345 66346 #ifdef __LITTLE_ENDIAN__ 66347 __ai __attribute__((target("neon"))) int16x4_t vzip1_s16(int16x4_t __p0, int16x4_t __p1) { 66348 int16x4_t __ret; 66349 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5); 66350 return __ret; 66351 } 66352 #else 66353 __ai __attribute__((target("neon"))) int16x4_t vzip1_s16(int16x4_t __p0, int16x4_t __p1) { 66354 int16x4_t __ret; 66355 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66356 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66357 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5); 66358 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66359 return __ret; 66360 } 66361 #endif 66362 66363 #ifdef __LITTLE_ENDIAN__ 66364 __ai __attribute__((target("neon"))) float16x8_t vzip1q_f16(float16x8_t __p0, float16x8_t __p1) { 66365 float16x8_t __ret; 66366 __ret = __builtin_shufflevector(__p0, __p1, 0, 8, 1, 9, 2, 10, 3, 11); 
66367 return __ret; 66368 } 66369 #else 66370 __ai __attribute__((target("neon"))) float16x8_t vzip1q_f16(float16x8_t __p0, float16x8_t __p1) { 66371 float16x8_t __ret; 66372 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66373 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66374 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 8, 1, 9, 2, 10, 3, 11); 66375 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66376 return __ret; 66377 } 66378 #endif 66379 66380 #ifdef __LITTLE_ENDIAN__ 66381 __ai __attribute__((target("neon"))) float16x4_t vzip1_f16(float16x4_t __p0, float16x4_t __p1) { 66382 float16x4_t __ret; 66383 __ret = __builtin_shufflevector(__p0, __p1, 0, 4, 1, 5); 66384 return __ret; 66385 } 66386 #else 66387 __ai __attribute__((target("neon"))) float16x4_t vzip1_f16(float16x4_t __p0, float16x4_t __p1) { 66388 float16x4_t __ret; 66389 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66390 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66391 __ret = __builtin_shufflevector(__rev0, __rev1, 0, 4, 1, 5); 66392 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66393 return __ret; 66394 } 66395 #endif 66396 66397 #ifdef __LITTLE_ENDIAN__ 66398 __ai __attribute__((target("neon"))) poly8x8_t vzip2_p8(poly8x8_t __p0, poly8x8_t __p1) { 66399 poly8x8_t __ret; 66400 __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15); 66401 return __ret; 66402 } 66403 #else 66404 __ai __attribute__((target("neon"))) poly8x8_t vzip2_p8(poly8x8_t __p0, poly8x8_t __p1) { 66405 poly8x8_t __ret; 66406 poly8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66407 poly8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66408 __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15); 66409 __ret = 
__builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66410 return __ret; 66411 } 66412 #endif 66413 66414 #ifdef __LITTLE_ENDIAN__ 66415 __ai __attribute__((target("neon"))) poly16x4_t vzip2_p16(poly16x4_t __p0, poly16x4_t __p1) { 66416 poly16x4_t __ret; 66417 __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7); 66418 return __ret; 66419 } 66420 #else 66421 __ai __attribute__((target("neon"))) poly16x4_t vzip2_p16(poly16x4_t __p0, poly16x4_t __p1) { 66422 poly16x4_t __ret; 66423 poly16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66424 poly16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66425 __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7); 66426 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66427 return __ret; 66428 } 66429 #endif 66430 66431 #ifdef __LITTLE_ENDIAN__ 66432 __ai __attribute__((target("neon"))) poly8x16_t vzip2q_p8(poly8x16_t __p0, poly8x16_t __p1) { 66433 poly8x16_t __ret; 66434 __ret = __builtin_shufflevector(__p0, __p1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31); 66435 return __ret; 66436 } 66437 #else 66438 __ai __attribute__((target("neon"))) poly8x16_t vzip2q_p8(poly8x16_t __p0, poly8x16_t __p1) { 66439 poly8x16_t __ret; 66440 poly8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66441 poly8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66442 __ret = __builtin_shufflevector(__rev0, __rev1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31); 66443 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66444 return __ret; 66445 } 66446 #endif 66447 66448 #ifdef __LITTLE_ENDIAN__ 66449 __ai __attribute__((target("neon"))) poly64x2_t vzip2q_p64(poly64x2_t __p0, poly64x2_t __p1) { 66450 poly64x2_t __ret; 66451 __ret = __builtin_shufflevector(__p0, __p1, 1, 
3); 66452 return __ret; 66453 } 66454 #else 66455 __ai __attribute__((target("neon"))) poly64x2_t vzip2q_p64(poly64x2_t __p0, poly64x2_t __p1) { 66456 poly64x2_t __ret; 66457 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66458 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66459 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 66460 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66461 return __ret; 66462 } 66463 #endif 66464 66465 #ifdef __LITTLE_ENDIAN__ 66466 __ai __attribute__((target("neon"))) poly16x8_t vzip2q_p16(poly16x8_t __p0, poly16x8_t __p1) { 66467 poly16x8_t __ret; 66468 __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15); 66469 return __ret; 66470 } 66471 #else 66472 __ai __attribute__((target("neon"))) poly16x8_t vzip2q_p16(poly16x8_t __p0, poly16x8_t __p1) { 66473 poly16x8_t __ret; 66474 poly16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66475 poly16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66476 __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15); 66477 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66478 return __ret; 66479 } 66480 #endif 66481 66482 #ifdef __LITTLE_ENDIAN__ 66483 __ai __attribute__((target("neon"))) uint8x16_t vzip2q_u8(uint8x16_t __p0, uint8x16_t __p1) { 66484 uint8x16_t __ret; 66485 __ret = __builtin_shufflevector(__p0, __p1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31); 66486 return __ret; 66487 } 66488 #else 66489 __ai __attribute__((target("neon"))) uint8x16_t vzip2q_u8(uint8x16_t __p0, uint8x16_t __p1) { 66490 uint8x16_t __ret; 66491 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66492 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66493 __ret = 
__builtin_shufflevector(__rev0, __rev1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31); 66494 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66495 return __ret; 66496 } 66497 #endif 66498 66499 #ifdef __LITTLE_ENDIAN__ 66500 __ai __attribute__((target("neon"))) uint32x4_t vzip2q_u32(uint32x4_t __p0, uint32x4_t __p1) { 66501 uint32x4_t __ret; 66502 __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7); 66503 return __ret; 66504 } 66505 #else 66506 __ai __attribute__((target("neon"))) uint32x4_t vzip2q_u32(uint32x4_t __p0, uint32x4_t __p1) { 66507 uint32x4_t __ret; 66508 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66509 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66510 __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7); 66511 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66512 return __ret; 66513 } 66514 #endif 66515 66516 #ifdef __LITTLE_ENDIAN__ 66517 __ai __attribute__((target("neon"))) uint64x2_t vzip2q_u64(uint64x2_t __p0, uint64x2_t __p1) { 66518 uint64x2_t __ret; 66519 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 66520 return __ret; 66521 } 66522 #else 66523 __ai __attribute__((target("neon"))) uint64x2_t vzip2q_u64(uint64x2_t __p0, uint64x2_t __p1) { 66524 uint64x2_t __ret; 66525 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66526 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66527 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 66528 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66529 return __ret; 66530 } 66531 #endif 66532 66533 #ifdef __LITTLE_ENDIAN__ 66534 __ai __attribute__((target("neon"))) uint16x8_t vzip2q_u16(uint16x8_t __p0, uint16x8_t __p1) { 66535 uint16x8_t __ret; 66536 __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15); 66537 return __ret; 66538 } 66539 #else 66540 __ai 
__attribute__((target("neon"))) uint16x8_t vzip2q_u16(uint16x8_t __p0, uint16x8_t __p1) { 66541 uint16x8_t __ret; 66542 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66543 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66544 __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15); 66545 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66546 return __ret; 66547 } 66548 #endif 66549 66550 #ifdef __LITTLE_ENDIAN__ 66551 __ai __attribute__((target("neon"))) int8x16_t vzip2q_s8(int8x16_t __p0, int8x16_t __p1) { 66552 int8x16_t __ret; 66553 __ret = __builtin_shufflevector(__p0, __p1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31); 66554 return __ret; 66555 } 66556 #else 66557 __ai __attribute__((target("neon"))) int8x16_t vzip2q_s8(int8x16_t __p0, int8x16_t __p1) { 66558 int8x16_t __ret; 66559 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66560 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66561 __ret = __builtin_shufflevector(__rev0, __rev1, 8, 24, 9, 25, 10, 26, 11, 27, 12, 28, 13, 29, 14, 30, 15, 31); 66562 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66563 return __ret; 66564 } 66565 #endif 66566 66567 #ifdef __LITTLE_ENDIAN__ 66568 __ai __attribute__((target("neon"))) float64x2_t vzip2q_f64(float64x2_t __p0, float64x2_t __p1) { 66569 float64x2_t __ret; 66570 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 66571 return __ret; 66572 } 66573 #else 66574 __ai __attribute__((target("neon"))) float64x2_t vzip2q_f64(float64x2_t __p0, float64x2_t __p1) { 66575 float64x2_t __ret; 66576 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66577 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 
66578 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 66579 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66580 return __ret; 66581 } 66582 #endif 66583 66584 #ifdef __LITTLE_ENDIAN__ 66585 __ai __attribute__((target("neon"))) float32x4_t vzip2q_f32(float32x4_t __p0, float32x4_t __p1) { 66586 float32x4_t __ret; 66587 __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7); 66588 return __ret; 66589 } 66590 #else 66591 __ai __attribute__((target("neon"))) float32x4_t vzip2q_f32(float32x4_t __p0, float32x4_t __p1) { 66592 float32x4_t __ret; 66593 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66594 float32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66595 __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7); 66596 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66597 return __ret; 66598 } 66599 #endif 66600 66601 #ifdef __LITTLE_ENDIAN__ 66602 __ai __attribute__((target("neon"))) int32x4_t vzip2q_s32(int32x4_t __p0, int32x4_t __p1) { 66603 int32x4_t __ret; 66604 __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7); 66605 return __ret; 66606 } 66607 #else 66608 __ai __attribute__((target("neon"))) int32x4_t vzip2q_s32(int32x4_t __p0, int32x4_t __p1) { 66609 int32x4_t __ret; 66610 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66611 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66612 __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7); 66613 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66614 return __ret; 66615 } 66616 #endif 66617 66618 #ifdef __LITTLE_ENDIAN__ 66619 __ai __attribute__((target("neon"))) int64x2_t vzip2q_s64(int64x2_t __p0, int64x2_t __p1) { 66620 int64x2_t __ret; 66621 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 66622 return __ret; 66623 } 66624 #else 66625 __ai __attribute__((target("neon"))) int64x2_t vzip2q_s64(int64x2_t __p0, int64x2_t __p1) { 66626 int64x2_t __ret; 
66627 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66628 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66629 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 66630 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66631 return __ret; 66632 } 66633 #endif 66634 66635 #ifdef __LITTLE_ENDIAN__ 66636 __ai __attribute__((target("neon"))) int16x8_t vzip2q_s16(int16x8_t __p0, int16x8_t __p1) { 66637 int16x8_t __ret; 66638 __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15); 66639 return __ret; 66640 } 66641 #else 66642 __ai __attribute__((target("neon"))) int16x8_t vzip2q_s16(int16x8_t __p0, int16x8_t __p1) { 66643 int16x8_t __ret; 66644 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66645 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66646 __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15); 66647 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66648 return __ret; 66649 } 66650 #endif 66651 66652 #ifdef __LITTLE_ENDIAN__ 66653 __ai __attribute__((target("neon"))) uint8x8_t vzip2_u8(uint8x8_t __p0, uint8x8_t __p1) { 66654 uint8x8_t __ret; 66655 __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15); 66656 return __ret; 66657 } 66658 #else 66659 __ai __attribute__((target("neon"))) uint8x8_t vzip2_u8(uint8x8_t __p0, uint8x8_t __p1) { 66660 uint8x8_t __ret; 66661 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66662 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66663 __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15); 66664 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66665 return __ret; 66666 } 66667 #endif 66668 66669 #ifdef __LITTLE_ENDIAN__ 66670 __ai __attribute__((target("neon"))) uint32x2_t vzip2_u32(uint32x2_t 
__p0, uint32x2_t __p1) { 66671 uint32x2_t __ret; 66672 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 66673 return __ret; 66674 } 66675 #else 66676 __ai __attribute__((target("neon"))) uint32x2_t vzip2_u32(uint32x2_t __p0, uint32x2_t __p1) { 66677 uint32x2_t __ret; 66678 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66679 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66680 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 66681 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66682 return __ret; 66683 } 66684 #endif 66685 66686 #ifdef __LITTLE_ENDIAN__ 66687 __ai __attribute__((target("neon"))) uint16x4_t vzip2_u16(uint16x4_t __p0, uint16x4_t __p1) { 66688 uint16x4_t __ret; 66689 __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7); 66690 return __ret; 66691 } 66692 #else 66693 __ai __attribute__((target("neon"))) uint16x4_t vzip2_u16(uint16x4_t __p0, uint16x4_t __p1) { 66694 uint16x4_t __ret; 66695 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66696 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66697 __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7); 66698 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66699 return __ret; 66700 } 66701 #endif 66702 66703 #ifdef __LITTLE_ENDIAN__ 66704 __ai __attribute__((target("neon"))) int8x8_t vzip2_s8(int8x8_t __p0, int8x8_t __p1) { 66705 int8x8_t __ret; 66706 __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15); 66707 return __ret; 66708 } 66709 #else 66710 __ai __attribute__((target("neon"))) int8x8_t vzip2_s8(int8x8_t __p0, int8x8_t __p1) { 66711 int8x8_t __ret; 66712 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66713 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66714 __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15); 66715 __ret = 
__builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66716 return __ret; 66717 } 66718 #endif 66719 66720 #ifdef __LITTLE_ENDIAN__ 66721 __ai __attribute__((target("neon"))) float32x2_t vzip2_f32(float32x2_t __p0, float32x2_t __p1) { 66722 float32x2_t __ret; 66723 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 66724 return __ret; 66725 } 66726 #else 66727 __ai __attribute__((target("neon"))) float32x2_t vzip2_f32(float32x2_t __p0, float32x2_t __p1) { 66728 float32x2_t __ret; 66729 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66730 float32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66731 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 66732 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66733 return __ret; 66734 } 66735 #endif 66736 66737 #ifdef __LITTLE_ENDIAN__ 66738 __ai __attribute__((target("neon"))) int32x2_t vzip2_s32(int32x2_t __p0, int32x2_t __p1) { 66739 int32x2_t __ret; 66740 __ret = __builtin_shufflevector(__p0, __p1, 1, 3); 66741 return __ret; 66742 } 66743 #else 66744 __ai __attribute__((target("neon"))) int32x2_t vzip2_s32(int32x2_t __p0, int32x2_t __p1) { 66745 int32x2_t __ret; 66746 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 66747 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 66748 __ret = __builtin_shufflevector(__rev0, __rev1, 1, 3); 66749 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 66750 return __ret; 66751 } 66752 #endif 66753 66754 #ifdef __LITTLE_ENDIAN__ 66755 __ai __attribute__((target("neon"))) int16x4_t vzip2_s16(int16x4_t __p0, int16x4_t __p1) { 66756 int16x4_t __ret; 66757 __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7); 66758 return __ret; 66759 } 66760 #else 66761 __ai __attribute__((target("neon"))) int16x4_t vzip2_s16(int16x4_t __p0, int16x4_t __p1) { 66762 int16x4_t __ret; 66763 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66764 int16x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66765 __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7); 66766 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66767 return __ret; 66768 } 66769 #endif 66770 66771 #ifdef __LITTLE_ENDIAN__ 66772 __ai __attribute__((target("neon"))) float16x8_t vzip2q_f16(float16x8_t __p0, float16x8_t __p1) { 66773 float16x8_t __ret; 66774 __ret = __builtin_shufflevector(__p0, __p1, 4, 12, 5, 13, 6, 14, 7, 15); 66775 return __ret; 66776 } 66777 #else 66778 __ai __attribute__((target("neon"))) float16x8_t vzip2q_f16(float16x8_t __p0, float16x8_t __p1) { 66779 float16x8_t __ret; 66780 float16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 66781 float16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 66782 __ret = __builtin_shufflevector(__rev0, __rev1, 4, 12, 5, 13, 6, 14, 7, 15); 66783 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 66784 return __ret; 66785 } 66786 #endif 66787 66788 #ifdef __LITTLE_ENDIAN__ 66789 __ai __attribute__((target("neon"))) float16x4_t vzip2_f16(float16x4_t __p0, float16x4_t __p1) { 66790 float16x4_t __ret; 66791 __ret = __builtin_shufflevector(__p0, __p1, 2, 6, 3, 7); 66792 return __ret; 66793 } 66794 #else 66795 __ai __attribute__((target("neon"))) float16x4_t vzip2_f16(float16x4_t __p0, float16x4_t __p1) { 66796 float16x4_t __ret; 66797 float16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66798 float16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 66799 __ret = __builtin_shufflevector(__rev0, __rev1, 2, 6, 3, 7); 66800 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 66801 return __ret; 66802 } 66803 #endif 66804 66805 #define vldap1_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 66806 poly64x1_t __ret; \ 66807 poly64x1_t __s1 = __p1; \ 66808 __ret = (poly64x1_t) __builtin_neon_vldap1_lane_p64(__p0, (int8x8_t)__s1, __p2, 6); \ 66809 
__ret; \ 66810 }) 66811 #ifdef __LITTLE_ENDIAN__ 66812 #define vldap1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 66813 poly64x2_t __ret; \ 66814 poly64x2_t __s1 = __p1; \ 66815 __ret = (poly64x2_t) __builtin_neon_vldap1q_lane_p64(__p0, (int8x16_t)__s1, __p2, 38); \ 66816 __ret; \ 66817 }) 66818 #else 66819 #define vldap1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 66820 poly64x2_t __ret; \ 66821 poly64x2_t __s1 = __p1; \ 66822 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 66823 __ret = (poly64x2_t) __builtin_neon_vldap1q_lane_p64(__p0, (int8x16_t)__rev1, __p2, 38); \ 66824 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 66825 __ret; \ 66826 }) 66827 #endif 66828 66829 #ifdef __LITTLE_ENDIAN__ 66830 #define vldap1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 66831 uint64x2_t __ret; \ 66832 uint64x2_t __s1 = __p1; \ 66833 __ret = (uint64x2_t) __builtin_neon_vldap1q_lane_u64(__p0, (int8x16_t)__s1, __p2, 51); \ 66834 __ret; \ 66835 }) 66836 #else 66837 #define vldap1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 66838 uint64x2_t __ret; \ 66839 uint64x2_t __s1 = __p1; \ 66840 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 66841 __ret = (uint64x2_t) __builtin_neon_vldap1q_lane_u64(__p0, (int8x16_t)__rev1, __p2, 51); \ 66842 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 66843 __ret; \ 66844 }) 66845 #endif 66846 66847 #ifdef __LITTLE_ENDIAN__ 66848 #define vldap1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 66849 float64x2_t __ret; \ 66850 float64x2_t __s1 = __p1; \ 66851 __ret = (float64x2_t) __builtin_neon_vldap1q_lane_f64(__p0, (int8x16_t)__s1, __p2, 42); \ 66852 __ret; \ 66853 }) 66854 #else 66855 #define vldap1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 66856 float64x2_t __ret; \ 66857 float64x2_t __s1 = __p1; \ 66858 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 66859 __ret = (float64x2_t) __builtin_neon_vldap1q_lane_f64(__p0, (int8x16_t)__rev1, __p2, 
42); \ 66860 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 66861 __ret; \ 66862 }) 66863 #endif 66864 66865 #ifdef __LITTLE_ENDIAN__ 66866 #define vldap1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 66867 int64x2_t __ret; \ 66868 int64x2_t __s1 = __p1; \ 66869 __ret = (int64x2_t) __builtin_neon_vldap1q_lane_s64(__p0, (int8x16_t)__s1, __p2, 35); \ 66870 __ret; \ 66871 }) 66872 #else 66873 #define vldap1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 66874 int64x2_t __ret; \ 66875 int64x2_t __s1 = __p1; \ 66876 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 66877 __ret = (int64x2_t) __builtin_neon_vldap1q_lane_s64(__p0, (int8x16_t)__rev1, __p2, 35); \ 66878 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 66879 __ret; \ 66880 }) 66881 #endif 66882 66883 #define vldap1_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 66884 uint64x1_t __ret; \ 66885 uint64x1_t __s1 = __p1; \ 66886 __ret = (uint64x1_t) __builtin_neon_vldap1_lane_u64(__p0, (int8x8_t)__s1, __p2, 19); \ 66887 __ret; \ 66888 }) 66889 #define vldap1_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 66890 float64x1_t __ret; \ 66891 float64x1_t __s1 = __p1; \ 66892 __ret = (float64x1_t) __builtin_neon_vldap1_lane_f64(__p0, (int8x8_t)__s1, __p2, 10); \ 66893 __ret; \ 66894 }) 66895 #define vldap1_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 66896 int64x1_t __ret; \ 66897 int64x1_t __s1 = __p1; \ 66898 __ret = (int64x1_t) __builtin_neon_vldap1_lane_s64(__p0, (int8x8_t)__s1, __p2, 3); \ 66899 __ret; \ 66900 }) 66901 #define vstl1_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 66902 poly64x1_t __s1 = __p1; \ 66903 __builtin_neon_vstl1_lane_p64(__p0, (int8x8_t)__s1, __p2, 6); \ 66904 }) 66905 #ifdef __LITTLE_ENDIAN__ 66906 #define vstl1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 66907 poly64x2_t __s1 = __p1; \ 66908 __builtin_neon_vstl1q_lane_p64(__p0, (int8x16_t)__s1, __p2, 38); \ 66909 }) 66910 #else 66911 #define vstl1q_lane_p64(__p0, __p1, __p2) __extension__ ({ \ 66912 
poly64x2_t __s1 = __p1; \ 66913 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 66914 __builtin_neon_vstl1q_lane_p64(__p0, (int8x16_t)__rev1, __p2, 38); \ 66915 }) 66916 #endif 66917 66918 #ifdef __LITTLE_ENDIAN__ 66919 #define vstl1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 66920 uint64x2_t __s1 = __p1; \ 66921 __builtin_neon_vstl1q_lane_u64(__p0, (int8x16_t)__s1, __p2, 51); \ 66922 }) 66923 #else 66924 #define vstl1q_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 66925 uint64x2_t __s1 = __p1; \ 66926 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 66927 __builtin_neon_vstl1q_lane_u64(__p0, (int8x16_t)__rev1, __p2, 51); \ 66928 }) 66929 #endif 66930 66931 #ifdef __LITTLE_ENDIAN__ 66932 #define vstl1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 66933 float64x2_t __s1 = __p1; \ 66934 __builtin_neon_vstl1q_lane_f64(__p0, (int8x16_t)__s1, __p2, 42); \ 66935 }) 66936 #else 66937 #define vstl1q_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 66938 float64x2_t __s1 = __p1; \ 66939 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 66940 __builtin_neon_vstl1q_lane_f64(__p0, (int8x16_t)__rev1, __p2, 42); \ 66941 }) 66942 #endif 66943 66944 #ifdef __LITTLE_ENDIAN__ 66945 #define vstl1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 66946 int64x2_t __s1 = __p1; \ 66947 __builtin_neon_vstl1q_lane_s64(__p0, (int8x16_t)__s1, __p2, 35); \ 66948 }) 66949 #else 66950 #define vstl1q_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 66951 int64x2_t __s1 = __p1; \ 66952 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 66953 __builtin_neon_vstl1q_lane_s64(__p0, (int8x16_t)__rev1, __p2, 35); \ 66954 }) 66955 #endif 66956 66957 #define vstl1_lane_u64(__p0, __p1, __p2) __extension__ ({ \ 66958 uint64x1_t __s1 = __p1; \ 66959 __builtin_neon_vstl1_lane_u64(__p0, (int8x8_t)__s1, __p2, 19); \ 66960 }) 66961 #define vstl1_lane_f64(__p0, __p1, __p2) __extension__ ({ \ 66962 float64x1_t __s1 = __p1; \ 
66963 __builtin_neon_vstl1_lane_f64(__p0, (int8x8_t)__s1, __p2, 10); \ 66964 }) 66965 #define vstl1_lane_s64(__p0, __p1, __p2) __extension__ ({ \ 66966 int64x1_t __s1 = __p1; \ 66967 __builtin_neon_vstl1_lane_s64(__p0, (int8x8_t)__s1, __p2, 3); \ 66968 }) 66969 #ifdef __LITTLE_ENDIAN__ 66970 __ai __attribute__((target("sha3,neon"))) uint8x16_t vbcaxq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 66971 uint8x16_t __ret; 66972 __ret = (uint8x16_t) __builtin_neon_vbcaxq_u8((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 48); 66973 return __ret; 66974 } 66975 #else 66976 __ai __attribute__((target("sha3,neon"))) uint8x16_t vbcaxq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 66977 uint8x16_t __ret; 66978 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66979 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66980 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66981 __ret = (uint8x16_t) __builtin_neon_vbcaxq_u8((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 48); 66982 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 66983 return __ret; 66984 } 66985 #endif 66986 66987 #ifdef __LITTLE_ENDIAN__ 66988 __ai __attribute__((target("sha3,neon"))) uint32x4_t vbcaxq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 66989 uint32x4_t __ret; 66990 __ret = (uint32x4_t) __builtin_neon_vbcaxq_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 66991 return __ret; 66992 } 66993 #else 66994 __ai __attribute__((target("sha3,neon"))) uint32x4_t vbcaxq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 66995 uint32x4_t __ret; 66996 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 66997 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 
2, 1, 0); 66998 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 66999 __ret = (uint32x4_t) __builtin_neon_vbcaxq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 67000 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67001 return __ret; 67002 } 67003 #endif 67004 67005 #ifdef __LITTLE_ENDIAN__ 67006 __ai __attribute__((target("sha3,neon"))) uint64x2_t vbcaxq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67007 uint64x2_t __ret; 67008 __ret = (uint64x2_t) __builtin_neon_vbcaxq_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51); 67009 return __ret; 67010 } 67011 #else 67012 __ai __attribute__((target("sha3,neon"))) uint64x2_t vbcaxq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67013 uint64x2_t __ret; 67014 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67015 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67016 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67017 __ret = (uint64x2_t) __builtin_neon_vbcaxq_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51); 67018 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67019 return __ret; 67020 } 67021 #endif 67022 67023 #ifdef __LITTLE_ENDIAN__ 67024 __ai __attribute__((target("sha3,neon"))) uint16x8_t vbcaxq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 67025 uint16x8_t __ret; 67026 __ret = (uint16x8_t) __builtin_neon_vbcaxq_u16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 49); 67027 return __ret; 67028 } 67029 #else 67030 __ai __attribute__((target("sha3,neon"))) uint16x8_t vbcaxq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 67031 uint16x8_t __ret; 67032 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 67033 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 67034 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 
1, 0); 67035 __ret = (uint16x8_t) __builtin_neon_vbcaxq_u16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 49); 67036 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 67037 return __ret; 67038 } 67039 #endif 67040 67041 #ifdef __LITTLE_ENDIAN__ 67042 __ai __attribute__((target("sha3,neon"))) int8x16_t vbcaxq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 67043 int8x16_t __ret; 67044 __ret = (int8x16_t) __builtin_neon_vbcaxq_s8((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 32); 67045 return __ret; 67046 } 67047 #else 67048 __ai __attribute__((target("sha3,neon"))) int8x16_t vbcaxq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 67049 int8x16_t __ret; 67050 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67051 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67052 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67053 __ret = (int8x16_t) __builtin_neon_vbcaxq_s8((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 32); 67054 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67055 return __ret; 67056 } 67057 #endif 67058 67059 #ifdef __LITTLE_ENDIAN__ 67060 __ai __attribute__((target("sha3,neon"))) int32x4_t vbcaxq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 67061 int32x4_t __ret; 67062 __ret = (int32x4_t) __builtin_neon_vbcaxq_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 67063 return __ret; 67064 } 67065 #else 67066 __ai __attribute__((target("sha3,neon"))) int32x4_t vbcaxq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 67067 int32x4_t __ret; 67068 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 67069 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 67070 int32x4_t __rev2; 
__rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 67071 __ret = (int32x4_t) __builtin_neon_vbcaxq_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34); 67072 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67073 return __ret; 67074 } 67075 #endif 67076 67077 #ifdef __LITTLE_ENDIAN__ 67078 __ai __attribute__((target("sha3,neon"))) int64x2_t vbcaxq_s64(int64x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 67079 int64x2_t __ret; 67080 __ret = (int64x2_t) __builtin_neon_vbcaxq_s64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 35); 67081 return __ret; 67082 } 67083 #else 67084 __ai __attribute__((target("sha3,neon"))) int64x2_t vbcaxq_s64(int64x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 67085 int64x2_t __ret; 67086 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67087 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67088 int64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67089 __ret = (int64x2_t) __builtin_neon_vbcaxq_s64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 35); 67090 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67091 return __ret; 67092 } 67093 #endif 67094 67095 #ifdef __LITTLE_ENDIAN__ 67096 __ai __attribute__((target("sha3,neon"))) int16x8_t vbcaxq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 67097 int16x8_t __ret; 67098 __ret = (int16x8_t) __builtin_neon_vbcaxq_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33); 67099 return __ret; 67100 } 67101 #else 67102 __ai __attribute__((target("sha3,neon"))) int16x8_t vbcaxq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 67103 int16x8_t __ret; 67104 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 67105 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 67106 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 67107 __ret = (int16x8_t) 
__builtin_neon_vbcaxq_s16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33); 67108 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 67109 return __ret; 67110 } 67111 #endif 67112 67113 #ifdef __LITTLE_ENDIAN__ 67114 __ai __attribute__((target("sha3,neon"))) uint8x16_t veor3q_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 67115 uint8x16_t __ret; 67116 __ret = (uint8x16_t) __builtin_neon_veor3q_u8((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 48); 67117 return __ret; 67118 } 67119 #else 67120 __ai __attribute__((target("sha3,neon"))) uint8x16_t veor3q_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 67121 uint8x16_t __ret; 67122 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67123 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67124 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67125 __ret = (uint8x16_t) __builtin_neon_veor3q_u8((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 48); 67126 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67127 return __ret; 67128 } 67129 #endif 67130 67131 #ifdef __LITTLE_ENDIAN__ 67132 __ai __attribute__((target("sha3,neon"))) uint32x4_t veor3q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 67133 uint32x4_t __ret; 67134 __ret = (uint32x4_t) __builtin_neon_veor3q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 67135 return __ret; 67136 } 67137 #else 67138 __ai __attribute__((target("sha3,neon"))) uint32x4_t veor3q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 67139 uint32x4_t __ret; 67140 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 67141 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 67142 uint32x4_t __rev2; __rev2 = 
__builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 67143 __ret = (uint32x4_t) __builtin_neon_veor3q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 67144 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67145 return __ret; 67146 } 67147 #endif 67148 67149 #ifdef __LITTLE_ENDIAN__ 67150 __ai __attribute__((target("sha3,neon"))) uint64x2_t veor3q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67151 uint64x2_t __ret; 67152 __ret = (uint64x2_t) __builtin_neon_veor3q_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51); 67153 return __ret; 67154 } 67155 #else 67156 __ai __attribute__((target("sha3,neon"))) uint64x2_t veor3q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67157 uint64x2_t __ret; 67158 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67159 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67160 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67161 __ret = (uint64x2_t) __builtin_neon_veor3q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51); 67162 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67163 return __ret; 67164 } 67165 #endif 67166 67167 #ifdef __LITTLE_ENDIAN__ 67168 __ai __attribute__((target("sha3,neon"))) uint16x8_t veor3q_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 67169 uint16x8_t __ret; 67170 __ret = (uint16x8_t) __builtin_neon_veor3q_u16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 49); 67171 return __ret; 67172 } 67173 #else 67174 __ai __attribute__((target("sha3,neon"))) uint16x8_t veor3q_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 67175 uint16x8_t __ret; 67176 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 67177 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 67178 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 67179 __ret = (uint16x8_t) 
__builtin_neon_veor3q_u16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 49); 67180 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 67181 return __ret; 67182 } 67183 #endif 67184 67185 #ifdef __LITTLE_ENDIAN__ 67186 __ai __attribute__((target("sha3,neon"))) int8x16_t veor3q_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 67187 int8x16_t __ret; 67188 __ret = (int8x16_t) __builtin_neon_veor3q_s8((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 32); 67189 return __ret; 67190 } 67191 #else 67192 __ai __attribute__((target("sha3,neon"))) int8x16_t veor3q_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 67193 int8x16_t __ret; 67194 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67195 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67196 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67197 __ret = (int8x16_t) __builtin_neon_veor3q_s8((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 32); 67198 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 67199 return __ret; 67200 } 67201 #endif 67202 67203 #ifdef __LITTLE_ENDIAN__ 67204 __ai __attribute__((target("sha3,neon"))) int32x4_t veor3q_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 67205 int32x4_t __ret; 67206 __ret = (int32x4_t) __builtin_neon_veor3q_s32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 34); 67207 return __ret; 67208 } 67209 #else 67210 __ai __attribute__((target("sha3,neon"))) int32x4_t veor3q_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 67211 int32x4_t __ret; 67212 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 67213 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 67214 int32x4_t __rev2; __rev2 = 
__builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 67215 __ret = (int32x4_t) __builtin_neon_veor3q_s32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 34); 67216 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67217 return __ret; 67218 } 67219 #endif 67220 67221 #ifdef __LITTLE_ENDIAN__ 67222 __ai __attribute__((target("sha3,neon"))) int64x2_t veor3q_s64(int64x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 67223 int64x2_t __ret; 67224 __ret = (int64x2_t) __builtin_neon_veor3q_s64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 35); 67225 return __ret; 67226 } 67227 #else 67228 __ai __attribute__((target("sha3,neon"))) int64x2_t veor3q_s64(int64x2_t __p0, int64x2_t __p1, int64x2_t __p2) { 67229 int64x2_t __ret; 67230 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67231 int64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67232 int64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67233 __ret = (int64x2_t) __builtin_neon_veor3q_s64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 35); 67234 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67235 return __ret; 67236 } 67237 #endif 67238 67239 #ifdef __LITTLE_ENDIAN__ 67240 __ai __attribute__((target("sha3,neon"))) int16x8_t veor3q_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 67241 int16x8_t __ret; 67242 __ret = (int16x8_t) __builtin_neon_veor3q_s16((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 33); 67243 return __ret; 67244 } 67245 #else 67246 __ai __attribute__((target("sha3,neon"))) int16x8_t veor3q_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 67247 int16x8_t __ret; 67248 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 67249 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 67250 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 67251 __ret = (int16x8_t) 
__builtin_neon_veor3q_s16((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 33); 67252 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 67253 return __ret; 67254 } 67255 #endif 67256 67257 #ifdef __LITTLE_ENDIAN__ 67258 __ai __attribute__((target("sha3,neon"))) uint64x2_t vrax1q_u64(uint64x2_t __p0, uint64x2_t __p1) { 67259 uint64x2_t __ret; 67260 __ret = (uint64x2_t) __builtin_neon_vrax1q_u64((int8x16_t)__p0, (int8x16_t)__p1, 51); 67261 return __ret; 67262 } 67263 #else 67264 __ai __attribute__((target("sha3,neon"))) uint64x2_t vrax1q_u64(uint64x2_t __p0, uint64x2_t __p1) { 67265 uint64x2_t __ret; 67266 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67267 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67268 __ret = (uint64x2_t) __builtin_neon_vrax1q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 67269 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67270 return __ret; 67271 } 67272 #endif 67273 67274 #ifdef __LITTLE_ENDIAN__ 67275 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512hq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67276 uint64x2_t __ret; 67277 __ret = (uint64x2_t) __builtin_neon_vsha512hq_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51); 67278 return __ret; 67279 } 67280 #else 67281 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512hq_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67282 uint64x2_t __ret; 67283 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67284 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67285 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67286 __ret = (uint64x2_t) __builtin_neon_vsha512hq_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51); 67287 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67288 return __ret; 67289 } 67290 #endif 67291 67292 #ifdef __LITTLE_ENDIAN__ 67293 __ai 
__attribute__((target("sha3,neon"))) uint64x2_t vsha512h2q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67294 uint64x2_t __ret; 67295 __ret = (uint64x2_t) __builtin_neon_vsha512h2q_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51); 67296 return __ret; 67297 } 67298 #else 67299 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512h2q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67300 uint64x2_t __ret; 67301 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67302 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67303 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67304 __ret = (uint64x2_t) __builtin_neon_vsha512h2q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51); 67305 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67306 return __ret; 67307 } 67308 #endif 67309 67310 #ifdef __LITTLE_ENDIAN__ 67311 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512su0q_u64(uint64x2_t __p0, uint64x2_t __p1) { 67312 uint64x2_t __ret; 67313 __ret = (uint64x2_t) __builtin_neon_vsha512su0q_u64((int8x16_t)__p0, (int8x16_t)__p1, 51); 67314 return __ret; 67315 } 67316 #else 67317 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512su0q_u64(uint64x2_t __p0, uint64x2_t __p1) { 67318 uint64x2_t __ret; 67319 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67320 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67321 __ret = (uint64x2_t) __builtin_neon_vsha512su0q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, 51); 67322 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67323 return __ret; 67324 } 67325 #endif 67326 67327 #ifdef __LITTLE_ENDIAN__ 67328 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512su1q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67329 uint64x2_t __ret; 67330 __ret = (uint64x2_t) __builtin_neon_vsha512su1q_u64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 51); 
67331 return __ret; 67332 } 67333 #else 67334 __ai __attribute__((target("sha3,neon"))) uint64x2_t vsha512su1q_u64(uint64x2_t __p0, uint64x2_t __p1, uint64x2_t __p2) { 67335 uint64x2_t __ret; 67336 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67337 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67338 uint64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67339 __ret = (uint64x2_t) __builtin_neon_vsha512su1q_u64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 51); 67340 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67341 return __ret; 67342 } 67343 #endif 67344 67345 #ifdef __LITTLE_ENDIAN__ 67346 #define vxarq_u64(__p0, __p1, __p2) __extension__ ({ \ 67347 uint64x2_t __ret; \ 67348 uint64x2_t __s0 = __p0; \ 67349 uint64x2_t __s1 = __p1; \ 67350 __ret = (uint64x2_t) __builtin_neon_vxarq_u64((int8x16_t)__s0, (int8x16_t)__s1, __p2, 51); \ 67351 __ret; \ 67352 }) 67353 #else 67354 #define vxarq_u64(__p0, __p1, __p2) __extension__ ({ \ 67355 uint64x2_t __ret; \ 67356 uint64x2_t __s0 = __p0; \ 67357 uint64x2_t __s1 = __p1; \ 67358 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 1, 0); \ 67359 uint64x2_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 1, 0); \ 67360 __ret = (uint64x2_t) __builtin_neon_vxarq_u64((int8x16_t)__rev0, (int8x16_t)__rev1, __p2, 51); \ 67361 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); \ 67362 __ret; \ 67363 }) 67364 #endif 67365 67366 #ifdef __LITTLE_ENDIAN__ 67367 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3partw1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 67368 uint32x4_t __ret; 67369 __ret = (uint32x4_t) __builtin_neon_vsm3partw1q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 67370 return __ret; 67371 } 67372 #else 67373 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3partw1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 67374 uint32x4_t __ret; 67375 uint32x4_t __rev0; 
__rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 67376 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 67377 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 67378 __ret = (uint32x4_t) __builtin_neon_vsm3partw1q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 67379 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67380 return __ret; 67381 } 67382 #endif 67383 67384 #ifdef __LITTLE_ENDIAN__ 67385 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3partw2q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 67386 uint32x4_t __ret; 67387 __ret = (uint32x4_t) __builtin_neon_vsm3partw2q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 67388 return __ret; 67389 } 67390 #else 67391 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3partw2q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 67392 uint32x4_t __ret; 67393 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 67394 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 67395 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 67396 __ret = (uint32x4_t) __builtin_neon_vsm3partw2q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 67397 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67398 return __ret; 67399 } 67400 #endif 67401 67402 #ifdef __LITTLE_ENDIAN__ 67403 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3ss1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 67404 uint32x4_t __ret; 67405 __ret = (uint32x4_t) __builtin_neon_vsm3ss1q_u32((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 50); 67406 return __ret; 67407 } 67408 #else 67409 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm3ss1q_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 67410 uint32x4_t __ret; 67411 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 67412 
uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 67413 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 67414 __ret = (uint32x4_t) __builtin_neon_vsm3ss1q_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 50); 67415 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67416 return __ret; 67417 } 67418 #endif 67419 67420 #ifdef __LITTLE_ENDIAN__ 67421 #define vsm3tt1aq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \ 67422 uint32x4_t __ret; \ 67423 uint32x4_t __s0 = __p0; \ 67424 uint32x4_t __s1 = __p1; \ 67425 uint32x4_t __s2 = __p2; \ 67426 __ret = (uint32x4_t) __builtin_neon_vsm3tt1aq_u32((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 50); \ 67427 __ret; \ 67428 }) 67429 #else 67430 #define vsm3tt1aq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \ 67431 uint32x4_t __ret; \ 67432 uint32x4_t __s0 = __p0; \ 67433 uint32x4_t __s1 = __p1; \ 67434 uint32x4_t __s2 = __p2; \ 67435 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 67436 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 67437 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 67438 __ret = (uint32x4_t) __builtin_neon_vsm3tt1aq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 50); \ 67439 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 67440 __ret; \ 67441 }) 67442 #endif 67443 67444 #ifdef __LITTLE_ENDIAN__ 67445 #define vsm3tt1bq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \ 67446 uint32x4_t __ret; \ 67447 uint32x4_t __s0 = __p0; \ 67448 uint32x4_t __s1 = __p1; \ 67449 uint32x4_t __s2 = __p2; \ 67450 __ret = (uint32x4_t) __builtin_neon_vsm3tt1bq_u32((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 50); \ 67451 __ret; \ 67452 }) 67453 #else 67454 #define vsm3tt1bq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \ 67455 uint32x4_t __ret; \ 67456 uint32x4_t __s0 = __p0; \ 67457 uint32x4_t __s1 = __p1; \ 67458 
uint32x4_t __s2 = __p2; \ 67459 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 67460 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 67461 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 67462 __ret = (uint32x4_t) __builtin_neon_vsm3tt1bq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 50); \ 67463 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 67464 __ret; \ 67465 }) 67466 #endif 67467 67468 #ifdef __LITTLE_ENDIAN__ 67469 #define vsm3tt2aq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \ 67470 uint32x4_t __ret; \ 67471 uint32x4_t __s0 = __p0; \ 67472 uint32x4_t __s1 = __p1; \ 67473 uint32x4_t __s2 = __p2; \ 67474 __ret = (uint32x4_t) __builtin_neon_vsm3tt2aq_u32((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 50); \ 67475 __ret; \ 67476 }) 67477 #else 67478 #define vsm3tt2aq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \ 67479 uint32x4_t __ret; \ 67480 uint32x4_t __s0 = __p0; \ 67481 uint32x4_t __s1 = __p1; \ 67482 uint32x4_t __s2 = __p2; \ 67483 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 67484 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 67485 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 67486 __ret = (uint32x4_t) __builtin_neon_vsm3tt2aq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 50); \ 67487 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 67488 __ret; \ 67489 }) 67490 #endif 67491 67492 #ifdef __LITTLE_ENDIAN__ 67493 #define vsm3tt2bq_u32(__p0, __p1, __p2, __p3) __extension__ ({ \ 67494 uint32x4_t __ret; \ 67495 uint32x4_t __s0 = __p0; \ 67496 uint32x4_t __s1 = __p1; \ 67497 uint32x4_t __s2 = __p2; \ 67498 __ret = (uint32x4_t) __builtin_neon_vsm3tt2bq_u32((int8x16_t)__s0, (int8x16_t)__s1, (int8x16_t)__s2, __p3, 50); \ 67499 __ret; \ 67500 }) 67501 #else 67502 #define vsm3tt2bq_u32(__p0, 
__p1, __p2, __p3) __extension__ ({ \ 67503 uint32x4_t __ret; \ 67504 uint32x4_t __s0 = __p0; \ 67505 uint32x4_t __s1 = __p1; \ 67506 uint32x4_t __s2 = __p2; \ 67507 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__s0, __s0, 3, 2, 1, 0); \ 67508 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__s1, __s1, 3, 2, 1, 0); \ 67509 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__s2, __s2, 3, 2, 1, 0); \ 67510 __ret = (uint32x4_t) __builtin_neon_vsm3tt2bq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, __p3, 50); \ 67511 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); \ 67512 __ret; \ 67513 }) 67514 #endif 67515 67516 #ifdef __LITTLE_ENDIAN__ 67517 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm4eq_u32(uint32x4_t __p0, uint32x4_t __p1) { 67518 uint32x4_t __ret; 67519 __ret = (uint32x4_t) __builtin_neon_vsm4eq_u32((int8x16_t)__p0, (int8x16_t)__p1, 50); 67520 return __ret; 67521 } 67522 #else 67523 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm4eq_u32(uint32x4_t __p0, uint32x4_t __p1) { 67524 uint32x4_t __ret; 67525 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 67526 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 67527 __ret = (uint32x4_t) __builtin_neon_vsm4eq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 67528 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67529 return __ret; 67530 } 67531 #endif 67532 67533 #ifdef __LITTLE_ENDIAN__ 67534 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm4ekeyq_u32(uint32x4_t __p0, uint32x4_t __p1) { 67535 uint32x4_t __ret; 67536 __ret = (uint32x4_t) __builtin_neon_vsm4ekeyq_u32((int8x16_t)__p0, (int8x16_t)__p1, 50); 67537 return __ret; 67538 } 67539 #else 67540 __ai __attribute__((target("sm4,neon"))) uint32x4_t vsm4ekeyq_u32(uint32x4_t __p0, uint32x4_t __p1) { 67541 uint32x4_t __ret; 67542 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 67543 uint32x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 67544 __ret = (uint32x4_t) __builtin_neon_vsm4ekeyq_u32((int8x16_t)__rev0, (int8x16_t)__rev1, 50); 67545 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 67546 return __ret; 67547 } 67548 #endif 67549 67550 __ai __attribute__((target("v8.1a,neon"))) int32_t vqrdmlahs_s32(int32_t __p0, int32_t __p1, int32_t __p2) { 67551 int32_t __ret; 67552 __ret = (int32_t) __builtin_neon_vqrdmlahs_s32(__p0, __p1, __p2); 67553 return __ret; 67554 } 67555 __ai __attribute__((target("v8.1a,neon"))) int16_t vqrdmlahh_s16(int16_t __p0, int16_t __p1, int16_t __p2) { 67556 int16_t __ret; 67557 __ret = (int16_t) __builtin_neon_vqrdmlahh_s16(__p0, __p1, __p2); 67558 return __ret; 67559 } 67560 #ifdef __LITTLE_ENDIAN__ 67561 #define vqrdmlahs_lane_s32(__p0_760, __p1_760, __p2_760, __p3_760) __extension__ ({ \ 67562 int32_t __ret_760; \ 67563 int32_t __s0_760 = __p0_760; \ 67564 int32_t __s1_760 = __p1_760; \ 67565 int32x2_t __s2_760 = __p2_760; \ 67566 __ret_760 = vqrdmlahs_s32(__s0_760, __s1_760, vget_lane_s32(__s2_760, __p3_760)); \ 67567 __ret_760; \ 67568 }) 67569 #else 67570 #define vqrdmlahs_lane_s32(__p0_761, __p1_761, __p2_761, __p3_761) __extension__ ({ \ 67571 int32_t __ret_761; \ 67572 int32_t __s0_761 = __p0_761; \ 67573 int32_t __s1_761 = __p1_761; \ 67574 int32x2_t __s2_761 = __p2_761; \ 67575 int32x2_t __rev2_761; __rev2_761 = __builtin_shufflevector(__s2_761, __s2_761, 1, 0); \ 67576 __ret_761 = vqrdmlahs_s32(__s0_761, __s1_761, __noswap_vget_lane_s32(__rev2_761, __p3_761)); \ 67577 __ret_761; \ 67578 }) 67579 #endif 67580 67581 #ifdef __LITTLE_ENDIAN__ 67582 #define vqrdmlahh_lane_s16(__p0_762, __p1_762, __p2_762, __p3_762) __extension__ ({ \ 67583 int16_t __ret_762; \ 67584 int16_t __s0_762 = __p0_762; \ 67585 int16_t __s1_762 = __p1_762; \ 67586 int16x4_t __s2_762 = __p2_762; \ 67587 __ret_762 = vqrdmlahh_s16(__s0_762, __s1_762, vget_lane_s16(__s2_762, __p3_762)); \ 67588 __ret_762; \ 67589 }) 67590 #else 67591 
#define vqrdmlahh_lane_s16(__p0_763, __p1_763, __p2_763, __p3_763) __extension__ ({ \ 67592 int16_t __ret_763; \ 67593 int16_t __s0_763 = __p0_763; \ 67594 int16_t __s1_763 = __p1_763; \ 67595 int16x4_t __s2_763 = __p2_763; \ 67596 int16x4_t __rev2_763; __rev2_763 = __builtin_shufflevector(__s2_763, __s2_763, 3, 2, 1, 0); \ 67597 __ret_763 = vqrdmlahh_s16(__s0_763, __s1_763, __noswap_vget_lane_s16(__rev2_763, __p3_763)); \ 67598 __ret_763; \ 67599 }) 67600 #endif 67601 67602 #ifdef __LITTLE_ENDIAN__ 67603 #define vqrdmlahs_laneq_s32(__p0_764, __p1_764, __p2_764, __p3_764) __extension__ ({ \ 67604 int32_t __ret_764; \ 67605 int32_t __s0_764 = __p0_764; \ 67606 int32_t __s1_764 = __p1_764; \ 67607 int32x4_t __s2_764 = __p2_764; \ 67608 __ret_764 = vqrdmlahs_s32(__s0_764, __s1_764, vgetq_lane_s32(__s2_764, __p3_764)); \ 67609 __ret_764; \ 67610 }) 67611 #else 67612 #define vqrdmlahs_laneq_s32(__p0_765, __p1_765, __p2_765, __p3_765) __extension__ ({ \ 67613 int32_t __ret_765; \ 67614 int32_t __s0_765 = __p0_765; \ 67615 int32_t __s1_765 = __p1_765; \ 67616 int32x4_t __s2_765 = __p2_765; \ 67617 int32x4_t __rev2_765; __rev2_765 = __builtin_shufflevector(__s2_765, __s2_765, 3, 2, 1, 0); \ 67618 __ret_765 = vqrdmlahs_s32(__s0_765, __s1_765, __noswap_vgetq_lane_s32(__rev2_765, __p3_765)); \ 67619 __ret_765; \ 67620 }) 67621 #endif 67622 67623 #ifdef __LITTLE_ENDIAN__ 67624 #define vqrdmlahh_laneq_s16(__p0_766, __p1_766, __p2_766, __p3_766) __extension__ ({ \ 67625 int16_t __ret_766; \ 67626 int16_t __s0_766 = __p0_766; \ 67627 int16_t __s1_766 = __p1_766; \ 67628 int16x8_t __s2_766 = __p2_766; \ 67629 __ret_766 = vqrdmlahh_s16(__s0_766, __s1_766, vgetq_lane_s16(__s2_766, __p3_766)); \ 67630 __ret_766; \ 67631 }) 67632 #else 67633 #define vqrdmlahh_laneq_s16(__p0_767, __p1_767, __p2_767, __p3_767) __extension__ ({ \ 67634 int16_t __ret_767; \ 67635 int16_t __s0_767 = __p0_767; \ 67636 int16_t __s1_767 = __p1_767; \ 67637 int16x8_t __s2_767 = __p2_767; \ 67638 int16x8_t 
__rev2_767; __rev2_767 = __builtin_shufflevector(__s2_767, __s2_767, 7, 6, 5, 4, 3, 2, 1, 0); \ 67639 __ret_767 = vqrdmlahh_s16(__s0_767, __s1_767, __noswap_vgetq_lane_s16(__rev2_767, __p3_767)); \ 67640 __ret_767; \ 67641 }) 67642 #endif 67643 67644 #ifdef __LITTLE_ENDIAN__ 67645 #define vqrdmlahq_laneq_s32(__p0_768, __p1_768, __p2_768, __p3_768) __extension__ ({ \ 67646 int32x4_t __ret_768; \ 67647 int32x4_t __s0_768 = __p0_768; \ 67648 int32x4_t __s1_768 = __p1_768; \ 67649 int32x4_t __s2_768 = __p2_768; \ 67650 __ret_768 = vqrdmlahq_s32(__s0_768, __s1_768, splatq_laneq_s32(__s2_768, __p3_768)); \ 67651 __ret_768; \ 67652 }) 67653 #else 67654 #define vqrdmlahq_laneq_s32(__p0_769, __p1_769, __p2_769, __p3_769) __extension__ ({ \ 67655 int32x4_t __ret_769; \ 67656 int32x4_t __s0_769 = __p0_769; \ 67657 int32x4_t __s1_769 = __p1_769; \ 67658 int32x4_t __s2_769 = __p2_769; \ 67659 int32x4_t __rev0_769; __rev0_769 = __builtin_shufflevector(__s0_769, __s0_769, 3, 2, 1, 0); \ 67660 int32x4_t __rev1_769; __rev1_769 = __builtin_shufflevector(__s1_769, __s1_769, 3, 2, 1, 0); \ 67661 int32x4_t __rev2_769; __rev2_769 = __builtin_shufflevector(__s2_769, __s2_769, 3, 2, 1, 0); \ 67662 __ret_769 = __noswap_vqrdmlahq_s32(__rev0_769, __rev1_769, __noswap_splatq_laneq_s32(__rev2_769, __p3_769)); \ 67663 __ret_769 = __builtin_shufflevector(__ret_769, __ret_769, 3, 2, 1, 0); \ 67664 __ret_769; \ 67665 }) 67666 #endif 67667 67668 #ifdef __LITTLE_ENDIAN__ 67669 #define vqrdmlahq_laneq_s16(__p0_770, __p1_770, __p2_770, __p3_770) __extension__ ({ \ 67670 int16x8_t __ret_770; \ 67671 int16x8_t __s0_770 = __p0_770; \ 67672 int16x8_t __s1_770 = __p1_770; \ 67673 int16x8_t __s2_770 = __p2_770; \ 67674 __ret_770 = vqrdmlahq_s16(__s0_770, __s1_770, splatq_laneq_s16(__s2_770, __p3_770)); \ 67675 __ret_770; \ 67676 }) 67677 #else 67678 #define vqrdmlahq_laneq_s16(__p0_771, __p1_771, __p2_771, __p3_771) __extension__ ({ \ 67679 int16x8_t __ret_771; \ 67680 int16x8_t __s0_771 = __p0_771; \ 67681 
int16x8_t __s1_771 = __p1_771; \ 67682 int16x8_t __s2_771 = __p2_771; \ 67683 int16x8_t __rev0_771; __rev0_771 = __builtin_shufflevector(__s0_771, __s0_771, 7, 6, 5, 4, 3, 2, 1, 0); \ 67684 int16x8_t __rev1_771; __rev1_771 = __builtin_shufflevector(__s1_771, __s1_771, 7, 6, 5, 4, 3, 2, 1, 0); \ 67685 int16x8_t __rev2_771; __rev2_771 = __builtin_shufflevector(__s2_771, __s2_771, 7, 6, 5, 4, 3, 2, 1, 0); \ 67686 __ret_771 = __noswap_vqrdmlahq_s16(__rev0_771, __rev1_771, __noswap_splatq_laneq_s16(__rev2_771, __p3_771)); \ 67687 __ret_771 = __builtin_shufflevector(__ret_771, __ret_771, 7, 6, 5, 4, 3, 2, 1, 0); \ 67688 __ret_771; \ 67689 }) 67690 #endif 67691 67692 #ifdef __LITTLE_ENDIAN__ 67693 #define vqrdmlah_laneq_s32(__p0_772, __p1_772, __p2_772, __p3_772) __extension__ ({ \ 67694 int32x2_t __ret_772; \ 67695 int32x2_t __s0_772 = __p0_772; \ 67696 int32x2_t __s1_772 = __p1_772; \ 67697 int32x4_t __s2_772 = __p2_772; \ 67698 __ret_772 = vqrdmlah_s32(__s0_772, __s1_772, splat_laneq_s32(__s2_772, __p3_772)); \ 67699 __ret_772; \ 67700 }) 67701 #else 67702 #define vqrdmlah_laneq_s32(__p0_773, __p1_773, __p2_773, __p3_773) __extension__ ({ \ 67703 int32x2_t __ret_773; \ 67704 int32x2_t __s0_773 = __p0_773; \ 67705 int32x2_t __s1_773 = __p1_773; \ 67706 int32x4_t __s2_773 = __p2_773; \ 67707 int32x2_t __rev0_773; __rev0_773 = __builtin_shufflevector(__s0_773, __s0_773, 1, 0); \ 67708 int32x2_t __rev1_773; __rev1_773 = __builtin_shufflevector(__s1_773, __s1_773, 1, 0); \ 67709 int32x4_t __rev2_773; __rev2_773 = __builtin_shufflevector(__s2_773, __s2_773, 3, 2, 1, 0); \ 67710 __ret_773 = __noswap_vqrdmlah_s32(__rev0_773, __rev1_773, __noswap_splat_laneq_s32(__rev2_773, __p3_773)); \ 67711 __ret_773 = __builtin_shufflevector(__ret_773, __ret_773, 1, 0); \ 67712 __ret_773; \ 67713 }) 67714 #endif 67715 67716 #ifdef __LITTLE_ENDIAN__ 67717 #define vqrdmlah_laneq_s16(__p0_774, __p1_774, __p2_774, __p3_774) __extension__ ({ \ 67718 int16x4_t __ret_774; \ 67719 int16x4_t 
__s0_774 = __p0_774; \ 67720 int16x4_t __s1_774 = __p1_774; \ 67721 int16x8_t __s2_774 = __p2_774; \ 67722 __ret_774 = vqrdmlah_s16(__s0_774, __s1_774, splat_laneq_s16(__s2_774, __p3_774)); \ 67723 __ret_774; \ 67724 }) 67725 #else 67726 #define vqrdmlah_laneq_s16(__p0_775, __p1_775, __p2_775, __p3_775) __extension__ ({ \ 67727 int16x4_t __ret_775; \ 67728 int16x4_t __s0_775 = __p0_775; \ 67729 int16x4_t __s1_775 = __p1_775; \ 67730 int16x8_t __s2_775 = __p2_775; \ 67731 int16x4_t __rev0_775; __rev0_775 = __builtin_shufflevector(__s0_775, __s0_775, 3, 2, 1, 0); \ 67732 int16x4_t __rev1_775; __rev1_775 = __builtin_shufflevector(__s1_775, __s1_775, 3, 2, 1, 0); \ 67733 int16x8_t __rev2_775; __rev2_775 = __builtin_shufflevector(__s2_775, __s2_775, 7, 6, 5, 4, 3, 2, 1, 0); \ 67734 __ret_775 = __noswap_vqrdmlah_s16(__rev0_775, __rev1_775, __noswap_splat_laneq_s16(__rev2_775, __p3_775)); \ 67735 __ret_775 = __builtin_shufflevector(__ret_775, __ret_775, 3, 2, 1, 0); \ 67736 __ret_775; \ 67737 }) 67738 #endif 67739 67740 __ai __attribute__((target("v8.1a,neon"))) int32_t vqrdmlshs_s32(int32_t __p0, int32_t __p1, int32_t __p2) { 67741 int32_t __ret; 67742 __ret = (int32_t) __builtin_neon_vqrdmlshs_s32(__p0, __p1, __p2); 67743 return __ret; 67744 } 67745 __ai __attribute__((target("v8.1a,neon"))) int16_t vqrdmlshh_s16(int16_t __p0, int16_t __p1, int16_t __p2) { 67746 int16_t __ret; 67747 __ret = (int16_t) __builtin_neon_vqrdmlshh_s16(__p0, __p1, __p2); 67748 return __ret; 67749 } 67750 #ifdef __LITTLE_ENDIAN__ 67751 #define vqrdmlshs_lane_s32(__p0_776, __p1_776, __p2_776, __p3_776) __extension__ ({ \ 67752 int32_t __ret_776; \ 67753 int32_t __s0_776 = __p0_776; \ 67754 int32_t __s1_776 = __p1_776; \ 67755 int32x2_t __s2_776 = __p2_776; \ 67756 __ret_776 = vqrdmlshs_s32(__s0_776, __s1_776, vget_lane_s32(__s2_776, __p3_776)); \ 67757 __ret_776; \ 67758 }) 67759 #else 67760 #define vqrdmlshs_lane_s32(__p0_777, __p1_777, __p2_777, __p3_777) __extension__ ({ \ 67761 int32_t 
__ret_777; \ 67762 int32_t __s0_777 = __p0_777; \ 67763 int32_t __s1_777 = __p1_777; \ 67764 int32x2_t __s2_777 = __p2_777; \ 67765 int32x2_t __rev2_777; __rev2_777 = __builtin_shufflevector(__s2_777, __s2_777, 1, 0); \ 67766 __ret_777 = vqrdmlshs_s32(__s0_777, __s1_777, __noswap_vget_lane_s32(__rev2_777, __p3_777)); \ 67767 __ret_777; \ 67768 }) 67769 #endif 67770 67771 #ifdef __LITTLE_ENDIAN__ 67772 #define vqrdmlshh_lane_s16(__p0_778, __p1_778, __p2_778, __p3_778) __extension__ ({ \ 67773 int16_t __ret_778; \ 67774 int16_t __s0_778 = __p0_778; \ 67775 int16_t __s1_778 = __p1_778; \ 67776 int16x4_t __s2_778 = __p2_778; \ 67777 __ret_778 = vqrdmlshh_s16(__s0_778, __s1_778, vget_lane_s16(__s2_778, __p3_778)); \ 67778 __ret_778; \ 67779 }) 67780 #else 67781 #define vqrdmlshh_lane_s16(__p0_779, __p1_779, __p2_779, __p3_779) __extension__ ({ \ 67782 int16_t __ret_779; \ 67783 int16_t __s0_779 = __p0_779; \ 67784 int16_t __s1_779 = __p1_779; \ 67785 int16x4_t __s2_779 = __p2_779; \ 67786 int16x4_t __rev2_779; __rev2_779 = __builtin_shufflevector(__s2_779, __s2_779, 3, 2, 1, 0); \ 67787 __ret_779 = vqrdmlshh_s16(__s0_779, __s1_779, __noswap_vget_lane_s16(__rev2_779, __p3_779)); \ 67788 __ret_779; \ 67789 }) 67790 #endif 67791 67792 #ifdef __LITTLE_ENDIAN__ 67793 #define vqrdmlshs_laneq_s32(__p0_780, __p1_780, __p2_780, __p3_780) __extension__ ({ \ 67794 int32_t __ret_780; \ 67795 int32_t __s0_780 = __p0_780; \ 67796 int32_t __s1_780 = __p1_780; \ 67797 int32x4_t __s2_780 = __p2_780; \ 67798 __ret_780 = vqrdmlshs_s32(__s0_780, __s1_780, vgetq_lane_s32(__s2_780, __p3_780)); \ 67799 __ret_780; \ 67800 }) 67801 #else 67802 #define vqrdmlshs_laneq_s32(__p0_781, __p1_781, __p2_781, __p3_781) __extension__ ({ \ 67803 int32_t __ret_781; \ 67804 int32_t __s0_781 = __p0_781; \ 67805 int32_t __s1_781 = __p1_781; \ 67806 int32x4_t __s2_781 = __p2_781; \ 67807 int32x4_t __rev2_781; __rev2_781 = __builtin_shufflevector(__s2_781, __s2_781, 3, 2, 1, 0); \ 67808 __ret_781 = 
vqrdmlshs_s32(__s0_781, __s1_781, __noswap_vgetq_lane_s32(__rev2_781, __p3_781)); \ 67809 __ret_781; \ 67810 }) 67811 #endif 67812 67813 #ifdef __LITTLE_ENDIAN__ 67814 #define vqrdmlshh_laneq_s16(__p0_782, __p1_782, __p2_782, __p3_782) __extension__ ({ \ 67815 int16_t __ret_782; \ 67816 int16_t __s0_782 = __p0_782; \ 67817 int16_t __s1_782 = __p1_782; \ 67818 int16x8_t __s2_782 = __p2_782; \ 67819 __ret_782 = vqrdmlshh_s16(__s0_782, __s1_782, vgetq_lane_s16(__s2_782, __p3_782)); \ 67820 __ret_782; \ 67821 }) 67822 #else 67823 #define vqrdmlshh_laneq_s16(__p0_783, __p1_783, __p2_783, __p3_783) __extension__ ({ \ 67824 int16_t __ret_783; \ 67825 int16_t __s0_783 = __p0_783; \ 67826 int16_t __s1_783 = __p1_783; \ 67827 int16x8_t __s2_783 = __p2_783; \ 67828 int16x8_t __rev2_783; __rev2_783 = __builtin_shufflevector(__s2_783, __s2_783, 7, 6, 5, 4, 3, 2, 1, 0); \ 67829 __ret_783 = vqrdmlshh_s16(__s0_783, __s1_783, __noswap_vgetq_lane_s16(__rev2_783, __p3_783)); \ 67830 __ret_783; \ 67831 }) 67832 #endif 67833 67834 #ifdef __LITTLE_ENDIAN__ 67835 #define vqrdmlshq_laneq_s32(__p0_784, __p1_784, __p2_784, __p3_784) __extension__ ({ \ 67836 int32x4_t __ret_784; \ 67837 int32x4_t __s0_784 = __p0_784; \ 67838 int32x4_t __s1_784 = __p1_784; \ 67839 int32x4_t __s2_784 = __p2_784; \ 67840 __ret_784 = vqrdmlshq_s32(__s0_784, __s1_784, splatq_laneq_s32(__s2_784, __p3_784)); \ 67841 __ret_784; \ 67842 }) 67843 #else 67844 #define vqrdmlshq_laneq_s32(__p0_785, __p1_785, __p2_785, __p3_785) __extension__ ({ \ 67845 int32x4_t __ret_785; \ 67846 int32x4_t __s0_785 = __p0_785; \ 67847 int32x4_t __s1_785 = __p1_785; \ 67848 int32x4_t __s2_785 = __p2_785; \ 67849 int32x4_t __rev0_785; __rev0_785 = __builtin_shufflevector(__s0_785, __s0_785, 3, 2, 1, 0); \ 67850 int32x4_t __rev1_785; __rev1_785 = __builtin_shufflevector(__s1_785, __s1_785, 3, 2, 1, 0); \ 67851 int32x4_t __rev2_785; __rev2_785 = __builtin_shufflevector(__s2_785, __s2_785, 3, 2, 1, 0); \ 67852 __ret_785 = 
__noswap_vqrdmlshq_s32(__rev0_785, __rev1_785, __noswap_splatq_laneq_s32(__rev2_785, __p3_785)); \ 67853 __ret_785 = __builtin_shufflevector(__ret_785, __ret_785, 3, 2, 1, 0); \ 67854 __ret_785; \ 67855 }) 67856 #endif 67857 67858 #ifdef __LITTLE_ENDIAN__ 67859 #define vqrdmlshq_laneq_s16(__p0_786, __p1_786, __p2_786, __p3_786) __extension__ ({ \ 67860 int16x8_t __ret_786; \ 67861 int16x8_t __s0_786 = __p0_786; \ 67862 int16x8_t __s1_786 = __p1_786; \ 67863 int16x8_t __s2_786 = __p2_786; \ 67864 __ret_786 = vqrdmlshq_s16(__s0_786, __s1_786, splatq_laneq_s16(__s2_786, __p3_786)); \ 67865 __ret_786; \ 67866 }) 67867 #else 67868 #define vqrdmlshq_laneq_s16(__p0_787, __p1_787, __p2_787, __p3_787) __extension__ ({ \ 67869 int16x8_t __ret_787; \ 67870 int16x8_t __s0_787 = __p0_787; \ 67871 int16x8_t __s1_787 = __p1_787; \ 67872 int16x8_t __s2_787 = __p2_787; \ 67873 int16x8_t __rev0_787; __rev0_787 = __builtin_shufflevector(__s0_787, __s0_787, 7, 6, 5, 4, 3, 2, 1, 0); \ 67874 int16x8_t __rev1_787; __rev1_787 = __builtin_shufflevector(__s1_787, __s1_787, 7, 6, 5, 4, 3, 2, 1, 0); \ 67875 int16x8_t __rev2_787; __rev2_787 = __builtin_shufflevector(__s2_787, __s2_787, 7, 6, 5, 4, 3, 2, 1, 0); \ 67876 __ret_787 = __noswap_vqrdmlshq_s16(__rev0_787, __rev1_787, __noswap_splatq_laneq_s16(__rev2_787, __p3_787)); \ 67877 __ret_787 = __builtin_shufflevector(__ret_787, __ret_787, 7, 6, 5, 4, 3, 2, 1, 0); \ 67878 __ret_787; \ 67879 }) 67880 #endif 67881 67882 #ifdef __LITTLE_ENDIAN__ 67883 #define vqrdmlsh_laneq_s32(__p0_788, __p1_788, __p2_788, __p3_788) __extension__ ({ \ 67884 int32x2_t __ret_788; \ 67885 int32x2_t __s0_788 = __p0_788; \ 67886 int32x2_t __s1_788 = __p1_788; \ 67887 int32x4_t __s2_788 = __p2_788; \ 67888 __ret_788 = vqrdmlsh_s32(__s0_788, __s1_788, splat_laneq_s32(__s2_788, __p3_788)); \ 67889 __ret_788; \ 67890 }) 67891 #else 67892 #define vqrdmlsh_laneq_s32(__p0_789, __p1_789, __p2_789, __p3_789) __extension__ ({ \ 67893 int32x2_t __ret_789; \ 67894 int32x2_t 
__s0_789 = __p0_789; \ 67895 int32x2_t __s1_789 = __p1_789; \ 67896 int32x4_t __s2_789 = __p2_789; \ 67897 int32x2_t __rev0_789; __rev0_789 = __builtin_shufflevector(__s0_789, __s0_789, 1, 0); \ 67898 int32x2_t __rev1_789; __rev1_789 = __builtin_shufflevector(__s1_789, __s1_789, 1, 0); \ 67899 int32x4_t __rev2_789; __rev2_789 = __builtin_shufflevector(__s2_789, __s2_789, 3, 2, 1, 0); \ 67900 __ret_789 = __noswap_vqrdmlsh_s32(__rev0_789, __rev1_789, __noswap_splat_laneq_s32(__rev2_789, __p3_789)); \ 67901 __ret_789 = __builtin_shufflevector(__ret_789, __ret_789, 1, 0); \ 67902 __ret_789; \ 67903 }) 67904 #endif 67905 67906 #ifdef __LITTLE_ENDIAN__ 67907 #define vqrdmlsh_laneq_s16(__p0_790, __p1_790, __p2_790, __p3_790) __extension__ ({ \ 67908 int16x4_t __ret_790; \ 67909 int16x4_t __s0_790 = __p0_790; \ 67910 int16x4_t __s1_790 = __p1_790; \ 67911 int16x8_t __s2_790 = __p2_790; \ 67912 __ret_790 = vqrdmlsh_s16(__s0_790, __s1_790, splat_laneq_s16(__s2_790, __p3_790)); \ 67913 __ret_790; \ 67914 }) 67915 #else 67916 #define vqrdmlsh_laneq_s16(__p0_791, __p1_791, __p2_791, __p3_791) __extension__ ({ \ 67917 int16x4_t __ret_791; \ 67918 int16x4_t __s0_791 = __p0_791; \ 67919 int16x4_t __s1_791 = __p1_791; \ 67920 int16x8_t __s2_791 = __p2_791; \ 67921 int16x4_t __rev0_791; __rev0_791 = __builtin_shufflevector(__s0_791, __s0_791, 3, 2, 1, 0); \ 67922 int16x4_t __rev1_791; __rev1_791 = __builtin_shufflevector(__s1_791, __s1_791, 3, 2, 1, 0); \ 67923 int16x8_t __rev2_791; __rev2_791 = __builtin_shufflevector(__s2_791, __s2_791, 7, 6, 5, 4, 3, 2, 1, 0); \ 67924 __ret_791 = __noswap_vqrdmlsh_s16(__rev0_791, __rev1_791, __noswap_splat_laneq_s16(__rev2_791, __p3_791)); \ 67925 __ret_791 = __builtin_shufflevector(__ret_791, __ret_791, 3, 2, 1, 0); \ 67926 __ret_791; \ 67927 }) 67928 #endif 67929 67930 #ifdef __LITTLE_ENDIAN__ 67931 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcaddq_rot270_f64(float64x2_t __p0, float64x2_t __p1) { 67932 float64x2_t __ret; 67933 __ret 
= (float64x2_t) __builtin_neon_vcaddq_rot270_f64((int8x16_t)__p0, (int8x16_t)__p1, 42); 67934 return __ret; 67935 } 67936 #else 67937 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcaddq_rot270_f64(float64x2_t __p0, float64x2_t __p1) { 67938 float64x2_t __ret; 67939 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67940 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67941 __ret = (float64x2_t) __builtin_neon_vcaddq_rot270_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 67942 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67943 return __ret; 67944 } 67945 #endif 67946 67947 #ifdef __LITTLE_ENDIAN__ 67948 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcaddq_rot90_f64(float64x2_t __p0, float64x2_t __p1) { 67949 float64x2_t __ret; 67950 __ret = (float64x2_t) __builtin_neon_vcaddq_rot90_f64((int8x16_t)__p0, (int8x16_t)__p1, 42); 67951 return __ret; 67952 } 67953 #else 67954 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcaddq_rot90_f64(float64x2_t __p0, float64x2_t __p1) { 67955 float64x2_t __ret; 67956 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67957 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67958 __ret = (float64x2_t) __builtin_neon_vcaddq_rot90_f64((int8x16_t)__rev0, (int8x16_t)__rev1, 42); 67959 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67960 return __ret; 67961 } 67962 #endif 67963 67964 #ifdef __LITTLE_ENDIAN__ 67965 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 67966 float64x2_t __ret; 67967 __ret = (float64x2_t) __builtin_neon_vcmlaq_f64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42); 67968 return __ret; 67969 } 67970 #else 67971 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 67972 float64x2_t __ret; 67973 float64x2_t __rev0; __rev0 = 
__builtin_shufflevector(__p0, __p0, 1, 0); 67974 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67975 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67976 __ret = (float64x2_t) __builtin_neon_vcmlaq_f64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42); 67977 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67978 return __ret; 67979 } 67980 #endif 67981 67982 #ifdef __LITTLE_ENDIAN__ 67983 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot180_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 67984 float64x2_t __ret; 67985 __ret = (float64x2_t) __builtin_neon_vcmlaq_rot180_f64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42); 67986 return __ret; 67987 } 67988 #else 67989 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot180_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 67990 float64x2_t __ret; 67991 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 67992 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 67993 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 67994 __ret = (float64x2_t) __builtin_neon_vcmlaq_rot180_f64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42); 67995 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 67996 return __ret; 67997 } 67998 #endif 67999 68000 #ifdef __LITTLE_ENDIAN__ 68001 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot270_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 68002 float64x2_t __ret; 68003 __ret = (float64x2_t) __builtin_neon_vcmlaq_rot270_f64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42); 68004 return __ret; 68005 } 68006 #else 68007 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot270_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 68008 float64x2_t __ret; 68009 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68010 float64x2_t 
__rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 68011 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 68012 __ret = (float64x2_t) __builtin_neon_vcmlaq_rot270_f64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42); 68013 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68014 return __ret; 68015 } 68016 #endif 68017 68018 #ifdef __LITTLE_ENDIAN__ 68019 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot90_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 68020 float64x2_t __ret; 68021 __ret = (float64x2_t) __builtin_neon_vcmlaq_rot90_f64((int8x16_t)__p0, (int8x16_t)__p1, (int8x16_t)__p2, 42); 68022 return __ret; 68023 } 68024 #else 68025 __ai __attribute__((target("v8.3a,neon"))) float64x2_t vcmlaq_rot90_f64(float64x2_t __p0, float64x2_t __p1, float64x2_t __p2) { 68026 float64x2_t __ret; 68027 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68028 float64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 68029 float64x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 68030 __ret = (float64x2_t) __builtin_neon_vcmlaq_rot90_f64((int8x16_t)__rev0, (int8x16_t)__rev1, (int8x16_t)__rev2, 42); 68031 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68032 return __ret; 68033 } 68034 #endif 68035 68036 #ifdef __LITTLE_ENDIAN__ 68037 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd32xq_f32(float32x4_t __p0) { 68038 float32x4_t __ret; 68039 __ret = (float32x4_t) __builtin_neon_vrnd32xq_f32((int8x16_t)__p0, 41); 68040 return __ret; 68041 } 68042 #else 68043 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd32xq_f32(float32x4_t __p0) { 68044 float32x4_t __ret; 68045 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68046 __ret = (float32x4_t) __builtin_neon_vrnd32xq_f32((int8x16_t)__rev0, 41); 68047 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68048 return __ret; 68049 } 68050 #endif 68051 
68052 #ifdef __LITTLE_ENDIAN__ 68053 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd32x_f32(float32x2_t __p0) { 68054 float32x2_t __ret; 68055 __ret = (float32x2_t) __builtin_neon_vrnd32x_f32((int8x8_t)__p0, 9); 68056 return __ret; 68057 } 68058 #else 68059 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd32x_f32(float32x2_t __p0) { 68060 float32x2_t __ret; 68061 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68062 __ret = (float32x2_t) __builtin_neon_vrnd32x_f32((int8x8_t)__rev0, 9); 68063 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68064 return __ret; 68065 } 68066 #endif 68067 68068 #ifdef __LITTLE_ENDIAN__ 68069 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd32xq_f64(float64x2_t __p0) { 68070 float64x2_t __ret; 68071 __ret = (float64x2_t) __builtin_neon_vrnd32xq_f64((int8x16_t)__p0, 42); 68072 return __ret; 68073 } 68074 #else 68075 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd32xq_f64(float64x2_t __p0) { 68076 float64x2_t __ret; 68077 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68078 __ret = (float64x2_t) __builtin_neon_vrnd32xq_f64((int8x16_t)__rev0, 42); 68079 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68080 return __ret; 68081 } 68082 #endif 68083 68084 __ai __attribute__((target("v8.5a,neon"))) float64x1_t vrnd32x_f64(float64x1_t __p0) { 68085 float64x1_t __ret; 68086 __ret = (float64x1_t) __builtin_neon_vrnd32x_f64((int8x8_t)__p0, 10); 68087 return __ret; 68088 } 68089 #ifdef __LITTLE_ENDIAN__ 68090 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd32zq_f32(float32x4_t __p0) { 68091 float32x4_t __ret; 68092 __ret = (float32x4_t) __builtin_neon_vrnd32zq_f32((int8x16_t)__p0, 41); 68093 return __ret; 68094 } 68095 #else 68096 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd32zq_f32(float32x4_t __p0) { 68097 float32x4_t __ret; 68098 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68099 __ret 
= (float32x4_t) __builtin_neon_vrnd32zq_f32((int8x16_t)__rev0, 41); 68100 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68101 return __ret; 68102 } 68103 #endif 68104 68105 #ifdef __LITTLE_ENDIAN__ 68106 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd32z_f32(float32x2_t __p0) { 68107 float32x2_t __ret; 68108 __ret = (float32x2_t) __builtin_neon_vrnd32z_f32((int8x8_t)__p0, 9); 68109 return __ret; 68110 } 68111 #else 68112 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd32z_f32(float32x2_t __p0) { 68113 float32x2_t __ret; 68114 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68115 __ret = (float32x2_t) __builtin_neon_vrnd32z_f32((int8x8_t)__rev0, 9); 68116 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68117 return __ret; 68118 } 68119 #endif 68120 68121 #ifdef __LITTLE_ENDIAN__ 68122 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd32zq_f64(float64x2_t __p0) { 68123 float64x2_t __ret; 68124 __ret = (float64x2_t) __builtin_neon_vrnd32zq_f64((int8x16_t)__p0, 42); 68125 return __ret; 68126 } 68127 #else 68128 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd32zq_f64(float64x2_t __p0) { 68129 float64x2_t __ret; 68130 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68131 __ret = (float64x2_t) __builtin_neon_vrnd32zq_f64((int8x16_t)__rev0, 42); 68132 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68133 return __ret; 68134 } 68135 #endif 68136 68137 __ai __attribute__((target("v8.5a,neon"))) float64x1_t vrnd32z_f64(float64x1_t __p0) { 68138 float64x1_t __ret; 68139 __ret = (float64x1_t) __builtin_neon_vrnd32z_f64((int8x8_t)__p0, 10); 68140 return __ret; 68141 } 68142 #ifdef __LITTLE_ENDIAN__ 68143 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd64xq_f32(float32x4_t __p0) { 68144 float32x4_t __ret; 68145 __ret = (float32x4_t) __builtin_neon_vrnd64xq_f32((int8x16_t)__p0, 41); 68146 return __ret; 68147 } 68148 #else 68149 __ai 
__attribute__((target("v8.5a,neon"))) float32x4_t vrnd64xq_f32(float32x4_t __p0) { 68150 float32x4_t __ret; 68151 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68152 __ret = (float32x4_t) __builtin_neon_vrnd64xq_f32((int8x16_t)__rev0, 41); 68153 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68154 return __ret; 68155 } 68156 #endif 68157 68158 #ifdef __LITTLE_ENDIAN__ 68159 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd64x_f32(float32x2_t __p0) { 68160 float32x2_t __ret; 68161 __ret = (float32x2_t) __builtin_neon_vrnd64x_f32((int8x8_t)__p0, 9); 68162 return __ret; 68163 } 68164 #else 68165 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd64x_f32(float32x2_t __p0) { 68166 float32x2_t __ret; 68167 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68168 __ret = (float32x2_t) __builtin_neon_vrnd64x_f32((int8x8_t)__rev0, 9); 68169 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68170 return __ret; 68171 } 68172 #endif 68173 68174 #ifdef __LITTLE_ENDIAN__ 68175 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd64xq_f64(float64x2_t __p0) { 68176 float64x2_t __ret; 68177 __ret = (float64x2_t) __builtin_neon_vrnd64xq_f64((int8x16_t)__p0, 42); 68178 return __ret; 68179 } 68180 #else 68181 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd64xq_f64(float64x2_t __p0) { 68182 float64x2_t __ret; 68183 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68184 __ret = (float64x2_t) __builtin_neon_vrnd64xq_f64((int8x16_t)__rev0, 42); 68185 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68186 return __ret; 68187 } 68188 #endif 68189 68190 __ai __attribute__((target("v8.5a,neon"))) float64x1_t vrnd64x_f64(float64x1_t __p0) { 68191 float64x1_t __ret; 68192 __ret = (float64x1_t) __builtin_neon_vrnd64x_f64((int8x8_t)__p0, 10); 68193 return __ret; 68194 } 68195 #ifdef __LITTLE_ENDIAN__ 68196 __ai __attribute__((target("v8.5a,neon"))) float32x4_t 
vrnd64zq_f32(float32x4_t __p0) { 68197 float32x4_t __ret; 68198 __ret = (float32x4_t) __builtin_neon_vrnd64zq_f32((int8x16_t)__p0, 41); 68199 return __ret; 68200 } 68201 #else 68202 __ai __attribute__((target("v8.5a,neon"))) float32x4_t vrnd64zq_f32(float32x4_t __p0) { 68203 float32x4_t __ret; 68204 float32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68205 __ret = (float32x4_t) __builtin_neon_vrnd64zq_f32((int8x16_t)__rev0, 41); 68206 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68207 return __ret; 68208 } 68209 #endif 68210 68211 #ifdef __LITTLE_ENDIAN__ 68212 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd64z_f32(float32x2_t __p0) { 68213 float32x2_t __ret; 68214 __ret = (float32x2_t) __builtin_neon_vrnd64z_f32((int8x8_t)__p0, 9); 68215 return __ret; 68216 } 68217 #else 68218 __ai __attribute__((target("v8.5a,neon"))) float32x2_t vrnd64z_f32(float32x2_t __p0) { 68219 float32x2_t __ret; 68220 float32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68221 __ret = (float32x2_t) __builtin_neon_vrnd64z_f32((int8x8_t)__rev0, 9); 68222 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68223 return __ret; 68224 } 68225 #endif 68226 68227 #ifdef __LITTLE_ENDIAN__ 68228 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd64zq_f64(float64x2_t __p0) { 68229 float64x2_t __ret; 68230 __ret = (float64x2_t) __builtin_neon_vrnd64zq_f64((int8x16_t)__p0, 42); 68231 return __ret; 68232 } 68233 #else 68234 __ai __attribute__((target("v8.5a,neon"))) float64x2_t vrnd64zq_f64(float64x2_t __p0) { 68235 float64x2_t __ret; 68236 float64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68237 __ret = (float64x2_t) __builtin_neon_vrnd64zq_f64((int8x16_t)__rev0, 42); 68238 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68239 return __ret; 68240 } 68241 #endif 68242 68243 __ai __attribute__((target("v8.5a,neon"))) float64x1_t vrnd64z_f64(float64x1_t __p0) { 68244 float64x1_t __ret; 68245 __ret = 
(float64x1_t) __builtin_neon_vrnd64z_f64((int8x8_t)__p0, 10); 68246 return __ret; 68247 } 68248 #endif 68249 #ifdef __LITTLE_ENDIAN__ 68250 #define vbfdotq_lane_f32(__p0_792, __p1_792, __p2_792, __p3_792) __extension__ ({ \ 68251 float32x4_t __ret_792; \ 68252 float32x4_t __s0_792 = __p0_792; \ 68253 bfloat16x8_t __s1_792 = __p1_792; \ 68254 bfloat16x4_t __s2_792 = __p2_792; \ 68255 __ret_792 = vbfdotq_f32(__s0_792, __s1_792, __builtin_bit_cast(bfloat16x8_t, splatq_lane_f32(__builtin_bit_cast(float32x2_t, __s2_792), __p3_792))); \ 68256 __ret_792; \ 68257 }) 68258 #else 68259 #define vbfdotq_lane_f32(__p0_793, __p1_793, __p2_793, __p3_793) __extension__ ({ \ 68260 float32x4_t __ret_793; \ 68261 float32x4_t __s0_793 = __p0_793; \ 68262 bfloat16x8_t __s1_793 = __p1_793; \ 68263 bfloat16x4_t __s2_793 = __p2_793; \ 68264 float32x4_t __rev0_793; __rev0_793 = __builtin_shufflevector(__s0_793, __s0_793, 3, 2, 1, 0); \ 68265 bfloat16x8_t __rev1_793; __rev1_793 = __builtin_shufflevector(__s1_793, __s1_793, 7, 6, 5, 4, 3, 2, 1, 0); \ 68266 bfloat16x4_t __rev2_793; __rev2_793 = __builtin_shufflevector(__s2_793, __s2_793, 3, 2, 1, 0); \ 68267 __ret_793 = __noswap_vbfdotq_f32(__rev0_793, __rev1_793, __builtin_bit_cast(bfloat16x8_t, __noswap_splatq_lane_f32(__builtin_bit_cast(float32x2_t, __rev2_793), __p3_793))); \ 68268 __ret_793 = __builtin_shufflevector(__ret_793, __ret_793, 3, 2, 1, 0); \ 68269 __ret_793; \ 68270 }) 68271 #endif 68272 68273 #ifdef __LITTLE_ENDIAN__ 68274 #define vbfdot_lane_f32(__p0_794, __p1_794, __p2_794, __p3_794) __extension__ ({ \ 68275 float32x2_t __ret_794; \ 68276 float32x2_t __s0_794 = __p0_794; \ 68277 bfloat16x4_t __s1_794 = __p1_794; \ 68278 bfloat16x4_t __s2_794 = __p2_794; \ 68279 __ret_794 = vbfdot_f32(__s0_794, __s1_794, __builtin_bit_cast(bfloat16x4_t, splat_lane_f32(__builtin_bit_cast(float32x2_t, __s2_794), __p3_794))); \ 68280 __ret_794; \ 68281 }) 68282 #else 68283 #define vbfdot_lane_f32(__p0_795, __p1_795, __p2_795, __p3_795) 
__extension__ ({ \ 68284 float32x2_t __ret_795; \ 68285 float32x2_t __s0_795 = __p0_795; \ 68286 bfloat16x4_t __s1_795 = __p1_795; \ 68287 bfloat16x4_t __s2_795 = __p2_795; \ 68288 float32x2_t __rev0_795; __rev0_795 = __builtin_shufflevector(__s0_795, __s0_795, 1, 0); \ 68289 bfloat16x4_t __rev1_795; __rev1_795 = __builtin_shufflevector(__s1_795, __s1_795, 3, 2, 1, 0); \ 68290 bfloat16x4_t __rev2_795; __rev2_795 = __builtin_shufflevector(__s2_795, __s2_795, 3, 2, 1, 0); \ 68291 __ret_795 = __noswap_vbfdot_f32(__rev0_795, __rev1_795, __builtin_bit_cast(bfloat16x4_t, __noswap_splat_lane_f32(__builtin_bit_cast(float32x2_t, __rev2_795), __p3_795))); \ 68292 __ret_795 = __builtin_shufflevector(__ret_795, __ret_795, 1, 0); \ 68293 __ret_795; \ 68294 }) 68295 #endif 68296 68297 #ifdef __LITTLE_ENDIAN__ 68298 #define vbfdotq_laneq_f32(__p0_796, __p1_796, __p2_796, __p3_796) __extension__ ({ \ 68299 float32x4_t __ret_796; \ 68300 float32x4_t __s0_796 = __p0_796; \ 68301 bfloat16x8_t __s1_796 = __p1_796; \ 68302 bfloat16x8_t __s2_796 = __p2_796; \ 68303 __ret_796 = vbfdotq_f32(__s0_796, __s1_796, __builtin_bit_cast(bfloat16x8_t, splatq_laneq_f32(__builtin_bit_cast(float32x4_t, __s2_796), __p3_796))); \ 68304 __ret_796; \ 68305 }) 68306 #else 68307 #define vbfdotq_laneq_f32(__p0_797, __p1_797, __p2_797, __p3_797) __extension__ ({ \ 68308 float32x4_t __ret_797; \ 68309 float32x4_t __s0_797 = __p0_797; \ 68310 bfloat16x8_t __s1_797 = __p1_797; \ 68311 bfloat16x8_t __s2_797 = __p2_797; \ 68312 float32x4_t __rev0_797; __rev0_797 = __builtin_shufflevector(__s0_797, __s0_797, 3, 2, 1, 0); \ 68313 bfloat16x8_t __rev1_797; __rev1_797 = __builtin_shufflevector(__s1_797, __s1_797, 7, 6, 5, 4, 3, 2, 1, 0); \ 68314 bfloat16x8_t __rev2_797; __rev2_797 = __builtin_shufflevector(__s2_797, __s2_797, 7, 6, 5, 4, 3, 2, 1, 0); \ 68315 __ret_797 = __noswap_vbfdotq_f32(__rev0_797, __rev1_797, __builtin_bit_cast(bfloat16x8_t, __noswap_splatq_laneq_f32(__builtin_bit_cast(float32x4_t, __rev2_797), 
__p3_797))); \ 68316 __ret_797 = __builtin_shufflevector(__ret_797, __ret_797, 3, 2, 1, 0); \ 68317 __ret_797; \ 68318 }) 68319 #endif 68320 68321 #ifdef __LITTLE_ENDIAN__ 68322 #define vbfdot_laneq_f32(__p0_798, __p1_798, __p2_798, __p3_798) __extension__ ({ \ 68323 float32x2_t __ret_798; \ 68324 float32x2_t __s0_798 = __p0_798; \ 68325 bfloat16x4_t __s1_798 = __p1_798; \ 68326 bfloat16x8_t __s2_798 = __p2_798; \ 68327 __ret_798 = vbfdot_f32(__s0_798, __s1_798, __builtin_bit_cast(bfloat16x4_t, splat_laneq_f32(__builtin_bit_cast(float32x4_t, __s2_798), __p3_798))); \ 68328 __ret_798; \ 68329 }) 68330 #else 68331 #define vbfdot_laneq_f32(__p0_799, __p1_799, __p2_799, __p3_799) __extension__ ({ \ 68332 float32x2_t __ret_799; \ 68333 float32x2_t __s0_799 = __p0_799; \ 68334 bfloat16x4_t __s1_799 = __p1_799; \ 68335 bfloat16x8_t __s2_799 = __p2_799; \ 68336 float32x2_t __rev0_799; __rev0_799 = __builtin_shufflevector(__s0_799, __s0_799, 1, 0); \ 68337 bfloat16x4_t __rev1_799; __rev1_799 = __builtin_shufflevector(__s1_799, __s1_799, 3, 2, 1, 0); \ 68338 bfloat16x8_t __rev2_799; __rev2_799 = __builtin_shufflevector(__s2_799, __s2_799, 7, 6, 5, 4, 3, 2, 1, 0); \ 68339 __ret_799 = __noswap_vbfdot_f32(__rev0_799, __rev1_799, __builtin_bit_cast(bfloat16x4_t, __noswap_splat_laneq_f32(__builtin_bit_cast(float32x4_t, __rev2_799), __p3_799))); \ 68340 __ret_799 = __builtin_shufflevector(__ret_799, __ret_799, 1, 0); \ 68341 __ret_799; \ 68342 }) 68343 #endif 68344 68345 #ifdef __LITTLE_ENDIAN__ 68346 #define vbfmlalbq_lane_f32(__p0_800, __p1_800, __p2_800, __p3_800) __extension__ ({ \ 68347 float32x4_t __ret_800; \ 68348 float32x4_t __s0_800 = __p0_800; \ 68349 bfloat16x8_t __s1_800 = __p1_800; \ 68350 bfloat16x4_t __s2_800 = __p2_800; \ 68351 __ret_800 = vbfmlalbq_f32(__s0_800, __s1_800, (bfloat16x8_t) {vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, 
__p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800), vget_lane_bf16(__s2_800, __p3_800)}); \ 68352 __ret_800; \ 68353 }) 68354 #else 68355 #define vbfmlalbq_lane_f32(__p0_801, __p1_801, __p2_801, __p3_801) __extension__ ({ \ 68356 float32x4_t __ret_801; \ 68357 float32x4_t __s0_801 = __p0_801; \ 68358 bfloat16x8_t __s1_801 = __p1_801; \ 68359 bfloat16x4_t __s2_801 = __p2_801; \ 68360 float32x4_t __rev0_801; __rev0_801 = __builtin_shufflevector(__s0_801, __s0_801, 3, 2, 1, 0); \ 68361 bfloat16x8_t __rev1_801; __rev1_801 = __builtin_shufflevector(__s1_801, __s1_801, 7, 6, 5, 4, 3, 2, 1, 0); \ 68362 bfloat16x4_t __rev2_801; __rev2_801 = __builtin_shufflevector(__s2_801, __s2_801, 3, 2, 1, 0); \ 68363 __ret_801 = __noswap_vbfmlalbq_f32(__rev0_801, __rev1_801, (bfloat16x8_t) {__noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801), __noswap_vget_lane_bf16(__rev2_801, __p3_801)}); \ 68364 __ret_801 = __builtin_shufflevector(__ret_801, __ret_801, 3, 2, 1, 0); \ 68365 __ret_801; \ 68366 }) 68367 #endif 68368 68369 #ifdef __LITTLE_ENDIAN__ 68370 #define vbfmlalbq_laneq_f32(__p0_802, __p1_802, __p2_802, __p3_802) __extension__ ({ \ 68371 float32x4_t __ret_802; \ 68372 float32x4_t __s0_802 = __p0_802; \ 68373 bfloat16x8_t __s1_802 = __p1_802; \ 68374 bfloat16x8_t __s2_802 = __p2_802; \ 68375 __ret_802 = vbfmlalbq_f32(__s0_802, __s1_802, (bfloat16x8_t) {vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802), vgetq_lane_bf16(__s2_802, __p3_802)}); \ 68376 __ret_802; \ 68377 }) 68378 
#else 68379 #define vbfmlalbq_laneq_f32(__p0_803, __p1_803, __p2_803, __p3_803) __extension__ ({ \ 68380 float32x4_t __ret_803; \ 68381 float32x4_t __s0_803 = __p0_803; \ 68382 bfloat16x8_t __s1_803 = __p1_803; \ 68383 bfloat16x8_t __s2_803 = __p2_803; \ 68384 float32x4_t __rev0_803; __rev0_803 = __builtin_shufflevector(__s0_803, __s0_803, 3, 2, 1, 0); \ 68385 bfloat16x8_t __rev1_803; __rev1_803 = __builtin_shufflevector(__s1_803, __s1_803, 7, 6, 5, 4, 3, 2, 1, 0); \ 68386 bfloat16x8_t __rev2_803; __rev2_803 = __builtin_shufflevector(__s2_803, __s2_803, 7, 6, 5, 4, 3, 2, 1, 0); \ 68387 __ret_803 = __noswap_vbfmlalbq_f32(__rev0_803, __rev1_803, (bfloat16x8_t) {__noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803), __noswap_vgetq_lane_bf16(__rev2_803, __p3_803)}); \ 68388 __ret_803 = __builtin_shufflevector(__ret_803, __ret_803, 3, 2, 1, 0); \ 68389 __ret_803; \ 68390 }) 68391 #endif 68392 68393 #ifdef __LITTLE_ENDIAN__ 68394 #define vbfmlaltq_lane_f32(__p0_804, __p1_804, __p2_804, __p3_804) __extension__ ({ \ 68395 float32x4_t __ret_804; \ 68396 float32x4_t __s0_804 = __p0_804; \ 68397 bfloat16x8_t __s1_804 = __p1_804; \ 68398 bfloat16x4_t __s2_804 = __p2_804; \ 68399 __ret_804 = vbfmlaltq_f32(__s0_804, __s1_804, (bfloat16x8_t) {vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804), vget_lane_bf16(__s2_804, __p3_804)}); \ 68400 __ret_804; \ 68401 }) 68402 #else 68403 #define vbfmlaltq_lane_f32(__p0_805, __p1_805, __p2_805, __p3_805) __extension__ ({ \ 68404 float32x4_t __ret_805; \ 68405 
float32x4_t __s0_805 = __p0_805; \ 68406 bfloat16x8_t __s1_805 = __p1_805; \ 68407 bfloat16x4_t __s2_805 = __p2_805; \ 68408 float32x4_t __rev0_805; __rev0_805 = __builtin_shufflevector(__s0_805, __s0_805, 3, 2, 1, 0); \ 68409 bfloat16x8_t __rev1_805; __rev1_805 = __builtin_shufflevector(__s1_805, __s1_805, 7, 6, 5, 4, 3, 2, 1, 0); \ 68410 bfloat16x4_t __rev2_805; __rev2_805 = __builtin_shufflevector(__s2_805, __s2_805, 3, 2, 1, 0); \ 68411 __ret_805 = __noswap_vbfmlaltq_f32(__rev0_805, __rev1_805, (bfloat16x8_t) {__noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805), __noswap_vget_lane_bf16(__rev2_805, __p3_805)}); \ 68412 __ret_805 = __builtin_shufflevector(__ret_805, __ret_805, 3, 2, 1, 0); \ 68413 __ret_805; \ 68414 }) 68415 #endif 68416 68417 #ifdef __LITTLE_ENDIAN__ 68418 #define vbfmlaltq_laneq_f32(__p0_806, __p1_806, __p2_806, __p3_806) __extension__ ({ \ 68419 float32x4_t __ret_806; \ 68420 float32x4_t __s0_806 = __p0_806; \ 68421 bfloat16x8_t __s1_806 = __p1_806; \ 68422 bfloat16x8_t __s2_806 = __p2_806; \ 68423 __ret_806 = vbfmlaltq_f32(__s0_806, __s1_806, (bfloat16x8_t) {vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806), vgetq_lane_bf16(__s2_806, __p3_806)}); \ 68424 __ret_806; \ 68425 }) 68426 #else 68427 #define vbfmlaltq_laneq_f32(__p0_807, __p1_807, __p2_807, __p3_807) __extension__ ({ \ 68428 float32x4_t __ret_807; \ 68429 float32x4_t __s0_807 = __p0_807; \ 68430 bfloat16x8_t __s1_807 = __p1_807; \ 68431 bfloat16x8_t __s2_807 = __p2_807; \ 68432 float32x4_t __rev0_807; 
__rev0_807 = __builtin_shufflevector(__s0_807, __s0_807, 3, 2, 1, 0); \ 68433 bfloat16x8_t __rev1_807; __rev1_807 = __builtin_shufflevector(__s1_807, __s1_807, 7, 6, 5, 4, 3, 2, 1, 0); \ 68434 bfloat16x8_t __rev2_807; __rev2_807 = __builtin_shufflevector(__s2_807, __s2_807, 7, 6, 5, 4, 3, 2, 1, 0); \ 68435 __ret_807 = __noswap_vbfmlaltq_f32(__rev0_807, __rev1_807, (bfloat16x8_t) {__noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807), __noswap_vgetq_lane_bf16(__rev2_807, __p3_807)}); \ 68436 __ret_807 = __builtin_shufflevector(__ret_807, __ret_807, 3, 2, 1, 0); \ 68437 __ret_807; \ 68438 }) 68439 #endif 68440 68441 #ifdef __LITTLE_ENDIAN__ 68442 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvt_f32_bf16(bfloat16x4_t __p0_808) { 68443 float32x4_t __ret_808; 68444 __ret_808 = __builtin_bit_cast(float32x4_t, vshll_n_u16(__builtin_bit_cast(uint16x4_t, __p0_808), 16)); 68445 return __ret_808; 68446 } 68447 #else 68448 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvt_f32_bf16(bfloat16x4_t __p0_809) { 68449 float32x4_t __ret_809; 68450 bfloat16x4_t __rev0_809; __rev0_809 = __builtin_shufflevector(__p0_809, __p0_809, 3, 2, 1, 0); 68451 __ret_809 = __builtin_bit_cast(float32x4_t, __noswap_vshll_n_u16(__builtin_bit_cast(uint16x4_t, __rev0_809), 16)); 68452 __ret_809 = __builtin_shufflevector(__ret_809, __ret_809, 3, 2, 1, 0); 68453 return __ret_809; 68454 } 68455 __ai __attribute__((target("bf16,neon"))) float32x4_t __noswap_vcvt_f32_bf16(bfloat16x4_t __p0_810) { 68456 float32x4_t __ret_810; 68457 __ret_810 = __builtin_bit_cast(float32x4_t, __noswap_vshll_n_u16(__builtin_bit_cast(uint16x4_t, __p0_810), 16)); 68458 return __ret_810; 68459 } 68460 #endif 68461 68462 #ifdef 
__LITTLE_ENDIAN__ 68463 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvtq_high_f32_bf16(bfloat16x8_t __p0) { 68464 float32x4_t __ret; 68465 __ret = vcvt_f32_bf16(vget_high_bf16(__p0)); 68466 return __ret; 68467 } 68468 #else 68469 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvtq_high_f32_bf16(bfloat16x8_t __p0) { 68470 float32x4_t __ret; 68471 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 68472 __ret = __noswap_vcvt_f32_bf16(__noswap_vget_high_bf16(__rev0)); 68473 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68474 return __ret; 68475 } 68476 #endif 68477 68478 #ifdef __LITTLE_ENDIAN__ 68479 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvtq_low_f32_bf16(bfloat16x8_t __p0) { 68480 float32x4_t __ret; 68481 __ret = vcvt_f32_bf16(vget_low_bf16(__p0)); 68482 return __ret; 68483 } 68484 #else 68485 __ai __attribute__((target("bf16,neon"))) float32x4_t vcvtq_low_f32_bf16(bfloat16x8_t __p0) { 68486 float32x4_t __ret; 68487 bfloat16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 68488 __ret = __noswap_vcvt_f32_bf16(__noswap_vget_low_bf16(__rev0)); 68489 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68490 return __ret; 68491 } 68492 #endif 68493 68494 #ifdef __LITTLE_ENDIAN__ 68495 #define vdotq_lane_u32(__p0_811, __p1_811, __p2_811, __p3_811) __extension__ ({ \ 68496 uint32x4_t __ret_811; \ 68497 uint32x4_t __s0_811 = __p0_811; \ 68498 uint8x16_t __s1_811 = __p1_811; \ 68499 uint8x8_t __s2_811 = __p2_811; \ 68500 __ret_811 = vdotq_u32(__s0_811, __s1_811, __builtin_bit_cast(uint8x16_t, splatq_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_811), __p3_811))); \ 68501 __ret_811; \ 68502 }) 68503 #else 68504 #define vdotq_lane_u32(__p0_812, __p1_812, __p2_812, __p3_812) __extension__ ({ \ 68505 uint32x4_t __ret_812; \ 68506 uint32x4_t __s0_812 = __p0_812; \ 68507 uint8x16_t __s1_812 = __p1_812; \ 68508 uint8x8_t __s2_812 = __p2_812; \ 68509 
uint32x4_t __rev0_812; __rev0_812 = __builtin_shufflevector(__s0_812, __s0_812, 3, 2, 1, 0); \ 68510 uint8x16_t __rev1_812; __rev1_812 = __builtin_shufflevector(__s1_812, __s1_812, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 68511 uint8x8_t __rev2_812; __rev2_812 = __builtin_shufflevector(__s2_812, __s2_812, 7, 6, 5, 4, 3, 2, 1, 0); \ 68512 __ret_812 = __noswap_vdotq_u32(__rev0_812, __rev1_812, __builtin_bit_cast(uint8x16_t, __noswap_splatq_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_812), __p3_812))); \ 68513 __ret_812 = __builtin_shufflevector(__ret_812, __ret_812, 3, 2, 1, 0); \ 68514 __ret_812; \ 68515 }) 68516 #endif 68517 68518 #ifdef __LITTLE_ENDIAN__ 68519 #define vdotq_lane_s32(__p0_813, __p1_813, __p2_813, __p3_813) __extension__ ({ \ 68520 int32x4_t __ret_813; \ 68521 int32x4_t __s0_813 = __p0_813; \ 68522 int8x16_t __s1_813 = __p1_813; \ 68523 int8x8_t __s2_813 = __p2_813; \ 68524 __ret_813 = vdotq_s32(__s0_813, __s1_813, __builtin_bit_cast(int8x16_t, splatq_lane_s32(__builtin_bit_cast(int32x2_t, __s2_813), __p3_813))); \ 68525 __ret_813; \ 68526 }) 68527 #else 68528 #define vdotq_lane_s32(__p0_814, __p1_814, __p2_814, __p3_814) __extension__ ({ \ 68529 int32x4_t __ret_814; \ 68530 int32x4_t __s0_814 = __p0_814; \ 68531 int8x16_t __s1_814 = __p1_814; \ 68532 int8x8_t __s2_814 = __p2_814; \ 68533 int32x4_t __rev0_814; __rev0_814 = __builtin_shufflevector(__s0_814, __s0_814, 3, 2, 1, 0); \ 68534 int8x16_t __rev1_814; __rev1_814 = __builtin_shufflevector(__s1_814, __s1_814, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 68535 int8x8_t __rev2_814; __rev2_814 = __builtin_shufflevector(__s2_814, __s2_814, 7, 6, 5, 4, 3, 2, 1, 0); \ 68536 __ret_814 = __noswap_vdotq_s32(__rev0_814, __rev1_814, __builtin_bit_cast(int8x16_t, __noswap_splatq_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_814), __p3_814))); \ 68537 __ret_814 = __builtin_shufflevector(__ret_814, __ret_814, 3, 2, 1, 0); \ 68538 __ret_814; \ 68539 }) 68540 #endif 68541 68542 
#ifdef __LITTLE_ENDIAN__ 68543 #define vdot_lane_u32(__p0_815, __p1_815, __p2_815, __p3_815) __extension__ ({ \ 68544 uint32x2_t __ret_815; \ 68545 uint32x2_t __s0_815 = __p0_815; \ 68546 uint8x8_t __s1_815 = __p1_815; \ 68547 uint8x8_t __s2_815 = __p2_815; \ 68548 __ret_815 = vdot_u32(__s0_815, __s1_815, __builtin_bit_cast(uint8x8_t, splat_lane_u32(__builtin_bit_cast(uint32x2_t, __s2_815), __p3_815))); \ 68549 __ret_815; \ 68550 }) 68551 #else 68552 #define vdot_lane_u32(__p0_816, __p1_816, __p2_816, __p3_816) __extension__ ({ \ 68553 uint32x2_t __ret_816; \ 68554 uint32x2_t __s0_816 = __p0_816; \ 68555 uint8x8_t __s1_816 = __p1_816; \ 68556 uint8x8_t __s2_816 = __p2_816; \ 68557 uint32x2_t __rev0_816; __rev0_816 = __builtin_shufflevector(__s0_816, __s0_816, 1, 0); \ 68558 uint8x8_t __rev1_816; __rev1_816 = __builtin_shufflevector(__s1_816, __s1_816, 7, 6, 5, 4, 3, 2, 1, 0); \ 68559 uint8x8_t __rev2_816; __rev2_816 = __builtin_shufflevector(__s2_816, __s2_816, 7, 6, 5, 4, 3, 2, 1, 0); \ 68560 __ret_816 = __noswap_vdot_u32(__rev0_816, __rev1_816, __builtin_bit_cast(uint8x8_t, __noswap_splat_lane_u32(__builtin_bit_cast(uint32x2_t, __rev2_816), __p3_816))); \ 68561 __ret_816 = __builtin_shufflevector(__ret_816, __ret_816, 1, 0); \ 68562 __ret_816; \ 68563 }) 68564 #endif 68565 68566 #ifdef __LITTLE_ENDIAN__ 68567 #define vdot_lane_s32(__p0_817, __p1_817, __p2_817, __p3_817) __extension__ ({ \ 68568 int32x2_t __ret_817; \ 68569 int32x2_t __s0_817 = __p0_817; \ 68570 int8x8_t __s1_817 = __p1_817; \ 68571 int8x8_t __s2_817 = __p2_817; \ 68572 __ret_817 = vdot_s32(__s0_817, __s1_817, __builtin_bit_cast(int8x8_t, splat_lane_s32(__builtin_bit_cast(int32x2_t, __s2_817), __p3_817))); \ 68573 __ret_817; \ 68574 }) 68575 #else 68576 #define vdot_lane_s32(__p0_818, __p1_818, __p2_818, __p3_818) __extension__ ({ \ 68577 int32x2_t __ret_818; \ 68578 int32x2_t __s0_818 = __p0_818; \ 68579 int8x8_t __s1_818 = __p1_818; \ 68580 int8x8_t __s2_818 = __p2_818; \ 68581 int32x2_t 
__rev0_818; __rev0_818 = __builtin_shufflevector(__s0_818, __s0_818, 1, 0); \ 68582 int8x8_t __rev1_818; __rev1_818 = __builtin_shufflevector(__s1_818, __s1_818, 7, 6, 5, 4, 3, 2, 1, 0); \ 68583 int8x8_t __rev2_818; __rev2_818 = __builtin_shufflevector(__s2_818, __s2_818, 7, 6, 5, 4, 3, 2, 1, 0); \ 68584 __ret_818 = __noswap_vdot_s32(__rev0_818, __rev1_818, __builtin_bit_cast(int8x8_t, __noswap_splat_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_818), __p3_818))); \ 68585 __ret_818 = __builtin_shufflevector(__ret_818, __ret_818, 1, 0); \ 68586 __ret_818; \ 68587 }) 68588 #endif 68589 68590 #ifdef __LITTLE_ENDIAN__ 68591 #define vmulq_lane_f16(__p0_819, __p1_819, __p2_819) __extension__ ({ \ 68592 float16x8_t __ret_819; \ 68593 float16x8_t __s0_819 = __p0_819; \ 68594 float16x4_t __s1_819 = __p1_819; \ 68595 __ret_819 = __s0_819 * splatq_lane_f16(__s1_819, __p2_819); \ 68596 __ret_819; \ 68597 }) 68598 #else 68599 #define vmulq_lane_f16(__p0_820, __p1_820, __p2_820) __extension__ ({ \ 68600 float16x8_t __ret_820; \ 68601 float16x8_t __s0_820 = __p0_820; \ 68602 float16x4_t __s1_820 = __p1_820; \ 68603 float16x8_t __rev0_820; __rev0_820 = __builtin_shufflevector(__s0_820, __s0_820, 7, 6, 5, 4, 3, 2, 1, 0); \ 68604 float16x4_t __rev1_820; __rev1_820 = __builtin_shufflevector(__s1_820, __s1_820, 3, 2, 1, 0); \ 68605 __ret_820 = __rev0_820 * __noswap_splatq_lane_f16(__rev1_820, __p2_820); \ 68606 __ret_820 = __builtin_shufflevector(__ret_820, __ret_820, 7, 6, 5, 4, 3, 2, 1, 0); \ 68607 __ret_820; \ 68608 }) 68609 #endif 68610 68611 #ifdef __LITTLE_ENDIAN__ 68612 #define vmul_lane_f16(__p0_821, __p1_821, __p2_821) __extension__ ({ \ 68613 float16x4_t __ret_821; \ 68614 float16x4_t __s0_821 = __p0_821; \ 68615 float16x4_t __s1_821 = __p1_821; \ 68616 __ret_821 = __s0_821 * splat_lane_f16(__s1_821, __p2_821); \ 68617 __ret_821; \ 68618 }) 68619 #else 68620 #define vmul_lane_f16(__p0_822, __p1_822, __p2_822) __extension__ ({ \ 68621 float16x4_t __ret_822; \ 68622 
float16x4_t __s0_822 = __p0_822; \ 68623 float16x4_t __s1_822 = __p1_822; \ 68624 float16x4_t __rev0_822; __rev0_822 = __builtin_shufflevector(__s0_822, __s0_822, 3, 2, 1, 0); \ 68625 float16x4_t __rev1_822; __rev1_822 = __builtin_shufflevector(__s1_822, __s1_822, 3, 2, 1, 0); \ 68626 __ret_822 = __rev0_822 * __noswap_splat_lane_f16(__rev1_822, __p2_822); \ 68627 __ret_822 = __builtin_shufflevector(__ret_822, __ret_822, 3, 2, 1, 0); \ 68628 __ret_822; \ 68629 }) 68630 #endif 68631 68632 #ifdef __LITTLE_ENDIAN__ 68633 #define vsudotq_lane_s32(__p0_823, __p1_823, __p2_823, __p3_823) __extension__ ({ \ 68634 int32x4_t __ret_823; \ 68635 int32x4_t __s0_823 = __p0_823; \ 68636 int8x16_t __s1_823 = __p1_823; \ 68637 uint8x8_t __s2_823 = __p2_823; \ 68638 __ret_823 = vusdotq_s32(__s0_823, (uint8x16_t)(splatq_lane_s32(__builtin_bit_cast(int32x2_t, __s2_823), __p3_823)), __s1_823); \ 68639 __ret_823; \ 68640 }) 68641 #else 68642 #define vsudotq_lane_s32(__p0_824, __p1_824, __p2_824, __p3_824) __extension__ ({ \ 68643 int32x4_t __ret_824; \ 68644 int32x4_t __s0_824 = __p0_824; \ 68645 int8x16_t __s1_824 = __p1_824; \ 68646 uint8x8_t __s2_824 = __p2_824; \ 68647 int32x4_t __rev0_824; __rev0_824 = __builtin_shufflevector(__s0_824, __s0_824, 3, 2, 1, 0); \ 68648 int8x16_t __rev1_824; __rev1_824 = __builtin_shufflevector(__s1_824, __s1_824, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 68649 uint8x8_t __rev2_824; __rev2_824 = __builtin_shufflevector(__s2_824, __s2_824, 7, 6, 5, 4, 3, 2, 1, 0); \ 68650 __ret_824 = __noswap_vusdotq_s32(__rev0_824, (uint8x16_t)(__noswap_splatq_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_824), __p3_824)), __rev1_824); \ 68651 __ret_824 = __builtin_shufflevector(__ret_824, __ret_824, 3, 2, 1, 0); \ 68652 __ret_824; \ 68653 }) 68654 #endif 68655 68656 #ifdef __LITTLE_ENDIAN__ 68657 #define vsudot_lane_s32(__p0_825, __p1_825, __p2_825, __p3_825) __extension__ ({ \ 68658 int32x2_t __ret_825; \ 68659 int32x2_t __s0_825 = __p0_825; \ 68660 
int8x8_t __s1_825 = __p1_825; \ 68661 uint8x8_t __s2_825 = __p2_825; \ 68662 __ret_825 = vusdot_s32(__s0_825, (uint8x8_t)(splat_lane_s32(__builtin_bit_cast(int32x2_t, __s2_825), __p3_825)), __s1_825); \ 68663 __ret_825; \ 68664 }) 68665 #else 68666 #define vsudot_lane_s32(__p0_826, __p1_826, __p2_826, __p3_826) __extension__ ({ \ 68667 int32x2_t __ret_826; \ 68668 int32x2_t __s0_826 = __p0_826; \ 68669 int8x8_t __s1_826 = __p1_826; \ 68670 uint8x8_t __s2_826 = __p2_826; \ 68671 int32x2_t __rev0_826; __rev0_826 = __builtin_shufflevector(__s0_826, __s0_826, 1, 0); \ 68672 int8x8_t __rev1_826; __rev1_826 = __builtin_shufflevector(__s1_826, __s1_826, 7, 6, 5, 4, 3, 2, 1, 0); \ 68673 uint8x8_t __rev2_826; __rev2_826 = __builtin_shufflevector(__s2_826, __s2_826, 7, 6, 5, 4, 3, 2, 1, 0); \ 68674 __ret_826 = __noswap_vusdot_s32(__rev0_826, (uint8x8_t)(__noswap_splat_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_826), __p3_826)), __rev1_826); \ 68675 __ret_826 = __builtin_shufflevector(__ret_826, __ret_826, 1, 0); \ 68676 __ret_826; \ 68677 }) 68678 #endif 68679 68680 #ifdef __LITTLE_ENDIAN__ 68681 #define vusdotq_lane_s32(__p0_827, __p1_827, __p2_827, __p3_827) __extension__ ({ \ 68682 int32x4_t __ret_827; \ 68683 int32x4_t __s0_827 = __p0_827; \ 68684 uint8x16_t __s1_827 = __p1_827; \ 68685 int8x8_t __s2_827 = __p2_827; \ 68686 __ret_827 = vusdotq_s32(__s0_827, __s1_827, (int8x16_t)(splatq_lane_s32(__builtin_bit_cast(int32x2_t, __s2_827), __p3_827))); \ 68687 __ret_827; \ 68688 }) 68689 #else 68690 #define vusdotq_lane_s32(__p0_828, __p1_828, __p2_828, __p3_828) __extension__ ({ \ 68691 int32x4_t __ret_828; \ 68692 int32x4_t __s0_828 = __p0_828; \ 68693 uint8x16_t __s1_828 = __p1_828; \ 68694 int8x8_t __s2_828 = __p2_828; \ 68695 int32x4_t __rev0_828; __rev0_828 = __builtin_shufflevector(__s0_828, __s0_828, 3, 2, 1, 0); \ 68696 uint8x16_t __rev1_828; __rev1_828 = __builtin_shufflevector(__s1_828, __s1_828, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); \ 68697 
int8x8_t __rev2_828; __rev2_828 = __builtin_shufflevector(__s2_828, __s2_828, 7, 6, 5, 4, 3, 2, 1, 0); \ 68698 __ret_828 = __noswap_vusdotq_s32(__rev0_828, __rev1_828, (int8x16_t)(__noswap_splatq_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_828), __p3_828))); \ 68699 __ret_828 = __builtin_shufflevector(__ret_828, __ret_828, 3, 2, 1, 0); \ 68700 __ret_828; \ 68701 }) 68702 #endif 68703 68704 #ifdef __LITTLE_ENDIAN__ 68705 #define vusdot_lane_s32(__p0_829, __p1_829, __p2_829, __p3_829) __extension__ ({ \ 68706 int32x2_t __ret_829; \ 68707 int32x2_t __s0_829 = __p0_829; \ 68708 uint8x8_t __s1_829 = __p1_829; \ 68709 int8x8_t __s2_829 = __p2_829; \ 68710 __ret_829 = vusdot_s32(__s0_829, __s1_829, (int8x8_t)(splat_lane_s32(__builtin_bit_cast(int32x2_t, __s2_829), __p3_829))); \ 68711 __ret_829; \ 68712 }) 68713 #else 68714 #define vusdot_lane_s32(__p0_830, __p1_830, __p2_830, __p3_830) __extension__ ({ \ 68715 int32x2_t __ret_830; \ 68716 int32x2_t __s0_830 = __p0_830; \ 68717 uint8x8_t __s1_830 = __p1_830; \ 68718 int8x8_t __s2_830 = __p2_830; \ 68719 int32x2_t __rev0_830; __rev0_830 = __builtin_shufflevector(__s0_830, __s0_830, 1, 0); \ 68720 uint8x8_t __rev1_830; __rev1_830 = __builtin_shufflevector(__s1_830, __s1_830, 7, 6, 5, 4, 3, 2, 1, 0); \ 68721 int8x8_t __rev2_830; __rev2_830 = __builtin_shufflevector(__s2_830, __s2_830, 7, 6, 5, 4, 3, 2, 1, 0); \ 68722 __ret_830 = __noswap_vusdot_s32(__rev0_830, __rev1_830, (int8x8_t)(__noswap_splat_lane_s32(__builtin_bit_cast(int32x2_t, __rev2_830), __p3_830))); \ 68723 __ret_830 = __builtin_shufflevector(__ret_830, __ret_830, 1, 0); \ 68724 __ret_830; \ 68725 }) 68726 #endif 68727 68728 #ifdef __LITTLE_ENDIAN__ 68729 __ai __attribute__((target("neon"))) uint8x16_t vabaq_u8(uint8x16_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 68730 uint8x16_t __ret; 68731 __ret = __p0 + vabdq_u8(__p1, __p2); 68732 return __ret; 68733 } 68734 #else 68735 __ai __attribute__((target("neon"))) uint8x16_t vabaq_u8(uint8x16_t __p0, uint8x16_t 
__p1, uint8x16_t __p2) { 68736 uint8x16_t __ret; 68737 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 68738 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 68739 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 68740 __ret = __rev0 + __noswap_vabdq_u8(__rev1, __rev2); 68741 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 68742 return __ret; 68743 } 68744 #endif 68745 68746 #ifdef __LITTLE_ENDIAN__ 68747 __ai __attribute__((target("neon"))) uint32x4_t vabaq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 68748 uint32x4_t __ret; 68749 __ret = __p0 + vabdq_u32(__p1, __p2); 68750 return __ret; 68751 } 68752 #else 68753 __ai __attribute__((target("neon"))) uint32x4_t vabaq_u32(uint32x4_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 68754 uint32x4_t __ret; 68755 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68756 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 68757 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 68758 __ret = __rev0 + __noswap_vabdq_u32(__rev1, __rev2); 68759 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68760 return __ret; 68761 } 68762 #endif 68763 68764 #ifdef __LITTLE_ENDIAN__ 68765 __ai __attribute__((target("neon"))) uint16x8_t vabaq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 68766 uint16x8_t __ret; 68767 __ret = __p0 + vabdq_u16(__p1, __p2); 68768 return __ret; 68769 } 68770 #else 68771 __ai __attribute__((target("neon"))) uint16x8_t vabaq_u16(uint16x8_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 68772 uint16x8_t __ret; 68773 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 68774 uint16x8_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 68775 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 68776 __ret = __rev0 + __noswap_vabdq_u16(__rev1, __rev2); 68777 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 68778 return __ret; 68779 } 68780 #endif 68781 68782 #ifdef __LITTLE_ENDIAN__ 68783 __ai __attribute__((target("neon"))) int8x16_t vabaq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 68784 int8x16_t __ret; 68785 __ret = __p0 + vabdq_s8(__p1, __p2); 68786 return __ret; 68787 } 68788 #else 68789 __ai __attribute__((target("neon"))) int8x16_t vabaq_s8(int8x16_t __p0, int8x16_t __p1, int8x16_t __p2) { 68790 int8x16_t __ret; 68791 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 68792 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 68793 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 68794 __ret = __rev0 + __noswap_vabdq_s8(__rev1, __rev2); 68795 __ret = __builtin_shufflevector(__ret, __ret, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 68796 return __ret; 68797 } 68798 #endif 68799 68800 #ifdef __LITTLE_ENDIAN__ 68801 __ai __attribute__((target("neon"))) int32x4_t vabaq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 68802 int32x4_t __ret; 68803 __ret = __p0 + vabdq_s32(__p1, __p2); 68804 return __ret; 68805 } 68806 #else 68807 __ai __attribute__((target("neon"))) int32x4_t vabaq_s32(int32x4_t __p0, int32x4_t __p1, int32x4_t __p2) { 68808 int32x4_t __ret; 68809 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68810 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 68811 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 68812 __ret = __rev0 + __noswap_vabdq_s32(__rev1, __rev2); 
68813 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68814 return __ret; 68815 } 68816 #endif 68817 68818 #ifdef __LITTLE_ENDIAN__ 68819 __ai __attribute__((target("neon"))) int16x8_t vabaq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 68820 int16x8_t __ret; 68821 __ret = __p0 + vabdq_s16(__p1, __p2); 68822 return __ret; 68823 } 68824 #else 68825 __ai __attribute__((target("neon"))) int16x8_t vabaq_s16(int16x8_t __p0, int16x8_t __p1, int16x8_t __p2) { 68826 int16x8_t __ret; 68827 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 68828 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 68829 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 68830 __ret = __rev0 + __noswap_vabdq_s16(__rev1, __rev2); 68831 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 68832 return __ret; 68833 } 68834 #endif 68835 68836 #ifdef __LITTLE_ENDIAN__ 68837 __ai __attribute__((target("neon"))) uint8x8_t vaba_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 68838 uint8x8_t __ret; 68839 __ret = __p0 + vabd_u8(__p1, __p2); 68840 return __ret; 68841 } 68842 #else 68843 __ai __attribute__((target("neon"))) uint8x8_t vaba_u8(uint8x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 68844 uint8x8_t __ret; 68845 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 68846 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 68847 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 68848 __ret = __rev0 + __noswap_vabd_u8(__rev1, __rev2); 68849 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 68850 return __ret; 68851 } 68852 #endif 68853 68854 #ifdef __LITTLE_ENDIAN__ 68855 __ai __attribute__((target("neon"))) uint32x2_t vaba_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 68856 uint32x2_t __ret; 68857 __ret = __p0 + 
vabd_u32(__p1, __p2); 68858 return __ret; 68859 } 68860 #else 68861 __ai __attribute__((target("neon"))) uint32x2_t vaba_u32(uint32x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 68862 uint32x2_t __ret; 68863 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68864 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 68865 uint32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 68866 __ret = __rev0 + __noswap_vabd_u32(__rev1, __rev2); 68867 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68868 return __ret; 68869 } 68870 #endif 68871 68872 #ifdef __LITTLE_ENDIAN__ 68873 __ai __attribute__((target("neon"))) uint16x4_t vaba_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 68874 uint16x4_t __ret; 68875 __ret = __p0 + vabd_u16(__p1, __p2); 68876 return __ret; 68877 } 68878 #else 68879 __ai __attribute__((target("neon"))) uint16x4_t vaba_u16(uint16x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 68880 uint16x4_t __ret; 68881 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68882 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 68883 uint16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 68884 __ret = __rev0 + __noswap_vabd_u16(__rev1, __rev2); 68885 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68886 return __ret; 68887 } 68888 #endif 68889 68890 #ifdef __LITTLE_ENDIAN__ 68891 __ai __attribute__((target("neon"))) int8x8_t vaba_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 68892 int8x8_t __ret; 68893 __ret = __p0 + vabd_s8(__p1, __p2); 68894 return __ret; 68895 } 68896 #else 68897 __ai __attribute__((target("neon"))) int8x8_t vaba_s8(int8x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 68898 int8x8_t __ret; 68899 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 68900 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 68901 int8x8_t __rev2; __rev2 = 
__builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 68902 __ret = __rev0 + __noswap_vabd_s8(__rev1, __rev2); 68903 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 68904 return __ret; 68905 } 68906 #endif 68907 68908 #ifdef __LITTLE_ENDIAN__ 68909 __ai __attribute__((target("neon"))) int32x2_t vaba_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 68910 int32x2_t __ret; 68911 __ret = __p0 + vabd_s32(__p1, __p2); 68912 return __ret; 68913 } 68914 #else 68915 __ai __attribute__((target("neon"))) int32x2_t vaba_s32(int32x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 68916 int32x2_t __ret; 68917 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68918 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 68919 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 68920 __ret = __rev0 + __noswap_vabd_s32(__rev1, __rev2); 68921 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68922 return __ret; 68923 } 68924 #endif 68925 68926 #ifdef __LITTLE_ENDIAN__ 68927 __ai __attribute__((target("neon"))) int16x4_t vaba_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 68928 int16x4_t __ret; 68929 __ret = __p0 + vabd_s16(__p1, __p2); 68930 return __ret; 68931 } 68932 #else 68933 __ai __attribute__((target("neon"))) int16x4_t vaba_s16(int16x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 68934 int16x4_t __ret; 68935 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68936 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 68937 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 68938 __ret = __rev0 + __noswap_vabd_s16(__rev1, __rev2); 68939 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 68940 return __ret; 68941 } 68942 #endif 68943 68944 #ifdef __LITTLE_ENDIAN__ 68945 __ai __attribute__((target("neon"))) uint16x8_t vabdl_u8(uint8x8_t __p0, uint8x8_t __p1) { 68946 uint16x8_t __ret; 68947 __ret = 
/*
 * vabdl_{u8,u32,u16,s8,s32,s16}: "long" absolute-difference wrappers.
 * Each one calls vabd_<t>(__p0, __p1), casts the result to the unsigned vector
 * type with the same lane count, passes it through vmovl_u<n>, and casts to the
 * declared return type.  The signed variants also use the unsigned vmovl_u<n>
 * (not vmovl_s<n>).
 * Under #ifdef __LITTLE_ENDIAN__ the helpers are called directly.  In the #else
 * branch both inputs are lane-reversed with __builtin_shufflevector, the
 * __noswap_ helpers are called, and the result is lane-reversed again; a
 * __noswap_vabdl_<t> variant that performs no shuffles is defined alongside.
 * NOTE(review): this text starts inside the little-endian vabdl_u8 body and ends
 * on the opening "#ifdef __LITTLE_ENDIAN__ ... __ai" of vaddl_u8.  The bare
 * five-digit numbers look like viewer line numbers fused into the text --
 * confirm against a clean copy of the header.
 */
(uint16x8_t)(vmovl_u8((uint8x8_t)(vabd_u8(__p0, __p1)))); 68948 return __ret; 68949 } 68950 #else 68951 __ai __attribute__((target("neon"))) uint16x8_t vabdl_u8(uint8x8_t __p0, uint8x8_t __p1) { 68952 uint16x8_t __ret; 68953 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 68954 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 68955 __ret = (uint16x8_t)(__noswap_vmovl_u8((uint8x8_t)(__noswap_vabd_u8(__rev0, __rev1)))); 68956 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 68957 return __ret; 68958 } 68959 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vabdl_u8(uint8x8_t __p0, uint8x8_t __p1) { 68960 uint16x8_t __ret; 68961 __ret = (uint16x8_t)(__noswap_vmovl_u8((uint8x8_t)(__noswap_vabd_u8(__p0, __p1)))); 68962 return __ret; 68963 } 68964 #endif 68965 68966 #ifdef __LITTLE_ENDIAN__ 68967 __ai __attribute__((target("neon"))) uint64x2_t vabdl_u32(uint32x2_t __p0, uint32x2_t __p1) { 68968 uint64x2_t __ret; 68969 __ret = (uint64x2_t)(vmovl_u32((uint32x2_t)(vabd_u32(__p0, __p1)))); 68970 return __ret; 68971 } 68972 #else 68973 __ai __attribute__((target("neon"))) uint64x2_t vabdl_u32(uint32x2_t __p0, uint32x2_t __p1) { 68974 uint64x2_t __ret; 68975 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 68976 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 68977 __ret = (uint64x2_t)(__noswap_vmovl_u32((uint32x2_t)(__noswap_vabd_u32(__rev0, __rev1)))); 68978 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 68979 return __ret; 68980 } 68981 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vabdl_u32(uint32x2_t __p0, uint32x2_t __p1) { 68982 uint64x2_t __ret; 68983 __ret = (uint64x2_t)(__noswap_vmovl_u32((uint32x2_t)(__noswap_vabd_u32(__p0, __p1)))); 68984 return __ret; 68985 } 68986 #endif 68987 68988 #ifdef __LITTLE_ENDIAN__ 68989 __ai __attribute__((target("neon"))) uint32x4_t vabdl_u16(uint16x4_t __p0, 
uint16x4_t __p1) { 68990 uint32x4_t __ret; 68991 __ret = (uint32x4_t)(vmovl_u16((uint16x4_t)(vabd_u16(__p0, __p1)))); 68992 return __ret; 68993 } 68994 #else 68995 __ai __attribute__((target("neon"))) uint32x4_t vabdl_u16(uint16x4_t __p0, uint16x4_t __p1) { 68996 uint32x4_t __ret; 68997 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 68998 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 68999 __ret = (uint32x4_t)(__noswap_vmovl_u16((uint16x4_t)(__noswap_vabd_u16(__rev0, __rev1)))); 69000 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69001 return __ret; 69002 } 69003 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vabdl_u16(uint16x4_t __p0, uint16x4_t __p1) { 69004 uint32x4_t __ret; 69005 __ret = (uint32x4_t)(__noswap_vmovl_u16((uint16x4_t)(__noswap_vabd_u16(__p0, __p1)))); 69006 return __ret; 69007 } 69008 #endif 69009 69010 #ifdef __LITTLE_ENDIAN__ 69011 __ai __attribute__((target("neon"))) int16x8_t vabdl_s8(int8x8_t __p0, int8x8_t __p1) { 69012 int16x8_t __ret; 69013 __ret = (int16x8_t)(vmovl_u8((uint8x8_t)(vabd_s8(__p0, __p1)))); 69014 return __ret; 69015 } 69016 #else 69017 __ai __attribute__((target("neon"))) int16x8_t vabdl_s8(int8x8_t __p0, int8x8_t __p1) { 69018 int16x8_t __ret; 69019 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 69020 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69021 __ret = (int16x8_t)(__noswap_vmovl_u8((uint8x8_t)(__noswap_vabd_s8(__rev0, __rev1)))); 69022 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69023 return __ret; 69024 } 69025 __ai __attribute__((target("neon"))) int16x8_t __noswap_vabdl_s8(int8x8_t __p0, int8x8_t __p1) { 69026 int16x8_t __ret; 69027 __ret = (int16x8_t)(__noswap_vmovl_u8((uint8x8_t)(__noswap_vabd_s8(__p0, __p1)))); 69028 return __ret; 69029 } 69030 #endif 69031 69032 #ifdef __LITTLE_ENDIAN__ 69033 __ai 
__attribute__((target("neon"))) int64x2_t vabdl_s32(int32x2_t __p0, int32x2_t __p1) { 69034 int64x2_t __ret; 69035 __ret = (int64x2_t)(vmovl_u32((uint32x2_t)(vabd_s32(__p0, __p1)))); 69036 return __ret; 69037 } 69038 #else 69039 __ai __attribute__((target("neon"))) int64x2_t vabdl_s32(int32x2_t __p0, int32x2_t __p1) { 69040 int64x2_t __ret; 69041 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69042 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69043 __ret = (int64x2_t)(__noswap_vmovl_u32((uint32x2_t)(__noswap_vabd_s32(__rev0, __rev1)))); 69044 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69045 return __ret; 69046 } 69047 __ai __attribute__((target("neon"))) int64x2_t __noswap_vabdl_s32(int32x2_t __p0, int32x2_t __p1) { 69048 int64x2_t __ret; 69049 __ret = (int64x2_t)(__noswap_vmovl_u32((uint32x2_t)(__noswap_vabd_s32(__p0, __p1)))); 69050 return __ret; 69051 } 69052 #endif 69053 69054 #ifdef __LITTLE_ENDIAN__ 69055 __ai __attribute__((target("neon"))) int32x4_t vabdl_s16(int16x4_t __p0, int16x4_t __p1) { 69056 int32x4_t __ret; 69057 __ret = (int32x4_t)(vmovl_u16((uint16x4_t)(vabd_s16(__p0, __p1)))); 69058 return __ret; 69059 } 69060 #else 69061 __ai __attribute__((target("neon"))) int32x4_t vabdl_s16(int16x4_t __p0, int16x4_t __p1) { 69062 int32x4_t __ret; 69063 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69064 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69065 __ret = (int32x4_t)(__noswap_vmovl_u16((uint16x4_t)(__noswap_vabd_s16(__rev0, __rev1)))); 69066 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69067 return __ret; 69068 } 69069 __ai __attribute__((target("neon"))) int32x4_t __noswap_vabdl_s16(int16x4_t __p0, int16x4_t __p1) { 69070 int32x4_t __ret; 69071 __ret = (int32x4_t)(__noswap_vmovl_u16((uint16x4_t)(__noswap_vabd_s16(__p0, __p1)))); 69072 return __ret; 69073 } 69074 #endif 69075 69076 #ifdef __LITTLE_ENDIAN__ 69077 __ai 
/*
 * vaddl_{u8,u32,u16,s8,s32,s16}: "long" add wrappers.
 * Each one returns vmovl_<t>(__p0) + vmovl_<t>(__p1), using the vmovl variant
 * whose signedness matches the argument type; the sum has the declared wider
 * return type.
 * In the #else (non-little-endian) branch both inputs are lane-reversed with
 * __builtin_shufflevector, __noswap_vmovl_<t> is used, and the sum is
 * lane-reversed again.  No __noswap_vaddl_* variants are defined in this text.
 * NOTE(review): this text starts right after the "#ifdef __LITTLE_ENDIAN__ ...
 * __ai" that opens vaddl_u8 and ends inside the #else body of vaddl_s16.  The
 * bare five-digit numbers look like viewer line numbers fused into the text --
 * confirm against a clean copy of the header.
 */
__attribute__((target("neon"))) uint16x8_t vaddl_u8(uint8x8_t __p0, uint8x8_t __p1) { 69078 uint16x8_t __ret; 69079 __ret = vmovl_u8(__p0) + vmovl_u8(__p1); 69080 return __ret; 69081 } 69082 #else 69083 __ai __attribute__((target("neon"))) uint16x8_t vaddl_u8(uint8x8_t __p0, uint8x8_t __p1) { 69084 uint16x8_t __ret; 69085 uint8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 69086 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69087 __ret = __noswap_vmovl_u8(__rev0) + __noswap_vmovl_u8(__rev1); 69088 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69089 return __ret; 69090 } 69091 #endif 69092 69093 #ifdef __LITTLE_ENDIAN__ 69094 __ai __attribute__((target("neon"))) uint64x2_t vaddl_u32(uint32x2_t __p0, uint32x2_t __p1) { 69095 uint64x2_t __ret; 69096 __ret = vmovl_u32(__p0) + vmovl_u32(__p1); 69097 return __ret; 69098 } 69099 #else 69100 __ai __attribute__((target("neon"))) uint64x2_t vaddl_u32(uint32x2_t __p0, uint32x2_t __p1) { 69101 uint64x2_t __ret; 69102 uint32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69103 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69104 __ret = __noswap_vmovl_u32(__rev0) + __noswap_vmovl_u32(__rev1); 69105 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69106 return __ret; 69107 } 69108 #endif 69109 69110 #ifdef __LITTLE_ENDIAN__ 69111 __ai __attribute__((target("neon"))) uint32x4_t vaddl_u16(uint16x4_t __p0, uint16x4_t __p1) { 69112 uint32x4_t __ret; 69113 __ret = vmovl_u16(__p0) + vmovl_u16(__p1); 69114 return __ret; 69115 } 69116 #else 69117 __ai __attribute__((target("neon"))) uint32x4_t vaddl_u16(uint16x4_t __p0, uint16x4_t __p1) { 69118 uint32x4_t __ret; 69119 uint16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69120 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69121 __ret = __noswap_vmovl_u16(__rev0) + 
__noswap_vmovl_u16(__rev1); 69122 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69123 return __ret; 69124 } 69125 #endif 69126 69127 #ifdef __LITTLE_ENDIAN__ 69128 __ai __attribute__((target("neon"))) int16x8_t vaddl_s8(int8x8_t __p0, int8x8_t __p1) { 69129 int16x8_t __ret; 69130 __ret = vmovl_s8(__p0) + vmovl_s8(__p1); 69131 return __ret; 69132 } 69133 #else 69134 __ai __attribute__((target("neon"))) int16x8_t vaddl_s8(int8x8_t __p0, int8x8_t __p1) { 69135 int16x8_t __ret; 69136 int8x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 69137 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69138 __ret = __noswap_vmovl_s8(__rev0) + __noswap_vmovl_s8(__rev1); 69139 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69140 return __ret; 69141 } 69142 #endif 69143 69144 #ifdef __LITTLE_ENDIAN__ 69145 __ai __attribute__((target("neon"))) int64x2_t vaddl_s32(int32x2_t __p0, int32x2_t __p1) { 69146 int64x2_t __ret; 69147 __ret = vmovl_s32(__p0) + vmovl_s32(__p1); 69148 return __ret; 69149 } 69150 #else 69151 __ai __attribute__((target("neon"))) int64x2_t vaddl_s32(int32x2_t __p0, int32x2_t __p1) { 69152 int64x2_t __ret; 69153 int32x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69154 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69155 __ret = __noswap_vmovl_s32(__rev0) + __noswap_vmovl_s32(__rev1); 69156 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69157 return __ret; 69158 } 69159 #endif 69160 69161 #ifdef __LITTLE_ENDIAN__ 69162 __ai __attribute__((target("neon"))) int32x4_t vaddl_s16(int16x4_t __p0, int16x4_t __p1) { 69163 int32x4_t __ret; 69164 __ret = vmovl_s16(__p0) + vmovl_s16(__p1); 69165 return __ret; 69166 } 69167 #else 69168 __ai __attribute__((target("neon"))) int32x4_t vaddl_s16(int16x4_t __p0, int16x4_t __p1) { 69169 int32x4_t __ret; 69170 int16x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 
/*
 * vaddw_{u8,u32,u16,s8,s32,s16}: "wide" add wrappers.  __p0 already has the
 * wide return type; each wrapper returns __p0 + vmovl_<t>(__p1).  In the #else
 * (non-little-endian) branch both inputs are lane-reversed with
 * __builtin_shufflevector, __noswap_vmovl_<t> is used, and the sum is
 * lane-reversed again.
 *
 * vget_lane_f16 / vgetq_lane_f16: statement-expression macros.  The vector
 * argument is copied into a typed local, reinterpreted as int16x4_t
 * (int16x8_t for the q form) with __builtin_bit_cast, handed to
 * vget_lane_s16 / vgetq_lane_s16 together with the lane argument, and the
 * scalar result is bit-cast to float16_t.  The #else branch lane-reverses the
 * vector first and calls the __noswap_ lane getter; a __noswap_ macro without
 * the shuffle is defined as well.
 * NOTE(review): this text starts inside the #else body of vaddl_s16 and ends
 * inside the #else vgetq_lane_f16 macro.  The bare five-digit numbers look like
 * viewer line numbers fused into the text -- confirm against a clean copy.
 */
0); 69171 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69172 __ret = __noswap_vmovl_s16(__rev0) + __noswap_vmovl_s16(__rev1); 69173 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69174 return __ret; 69175 } 69176 #endif 69177 69178 #ifdef __LITTLE_ENDIAN__ 69179 __ai __attribute__((target("neon"))) uint16x8_t vaddw_u8(uint16x8_t __p0, uint8x8_t __p1) { 69180 uint16x8_t __ret; 69181 __ret = __p0 + vmovl_u8(__p1); 69182 return __ret; 69183 } 69184 #else 69185 __ai __attribute__((target("neon"))) uint16x8_t vaddw_u8(uint16x8_t __p0, uint8x8_t __p1) { 69186 uint16x8_t __ret; 69187 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 69188 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69189 __ret = __rev0 + __noswap_vmovl_u8(__rev1); 69190 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69191 return __ret; 69192 } 69193 #endif 69194 69195 #ifdef __LITTLE_ENDIAN__ 69196 __ai __attribute__((target("neon"))) uint64x2_t vaddw_u32(uint64x2_t __p0, uint32x2_t __p1) { 69197 uint64x2_t __ret; 69198 __ret = __p0 + vmovl_u32(__p1); 69199 return __ret; 69200 } 69201 #else 69202 __ai __attribute__((target("neon"))) uint64x2_t vaddw_u32(uint64x2_t __p0, uint32x2_t __p1) { 69203 uint64x2_t __ret; 69204 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69205 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69206 __ret = __rev0 + __noswap_vmovl_u32(__rev1); 69207 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69208 return __ret; 69209 } 69210 #endif 69211 69212 #ifdef __LITTLE_ENDIAN__ 69213 __ai __attribute__((target("neon"))) uint32x4_t vaddw_u16(uint32x4_t __p0, uint16x4_t __p1) { 69214 uint32x4_t __ret; 69215 __ret = __p0 + vmovl_u16(__p1); 69216 return __ret; 69217 } 69218 #else 69219 __ai __attribute__((target("neon"))) uint32x4_t vaddw_u16(uint32x4_t __p0, uint16x4_t __p1) { 69220 
uint32x4_t __ret; 69221 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69222 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69223 __ret = __rev0 + __noswap_vmovl_u16(__rev1); 69224 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69225 return __ret; 69226 } 69227 #endif 69228 69229 #ifdef __LITTLE_ENDIAN__ 69230 __ai __attribute__((target("neon"))) int16x8_t vaddw_s8(int16x8_t __p0, int8x8_t __p1) { 69231 int16x8_t __ret; 69232 __ret = __p0 + vmovl_s8(__p1); 69233 return __ret; 69234 } 69235 #else 69236 __ai __attribute__((target("neon"))) int16x8_t vaddw_s8(int16x8_t __p0, int8x8_t __p1) { 69237 int16x8_t __ret; 69238 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 69239 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69240 __ret = __rev0 + __noswap_vmovl_s8(__rev1); 69241 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69242 return __ret; 69243 } 69244 #endif 69245 69246 #ifdef __LITTLE_ENDIAN__ 69247 __ai __attribute__((target("neon"))) int64x2_t vaddw_s32(int64x2_t __p0, int32x2_t __p1) { 69248 int64x2_t __ret; 69249 __ret = __p0 + vmovl_s32(__p1); 69250 return __ret; 69251 } 69252 #else 69253 __ai __attribute__((target("neon"))) int64x2_t vaddw_s32(int64x2_t __p0, int32x2_t __p1) { 69254 int64x2_t __ret; 69255 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69256 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69257 __ret = __rev0 + __noswap_vmovl_s32(__rev1); 69258 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69259 return __ret; 69260 } 69261 #endif 69262 69263 #ifdef __LITTLE_ENDIAN__ 69264 __ai __attribute__((target("neon"))) int32x4_t vaddw_s16(int32x4_t __p0, int16x4_t __p1) { 69265 int32x4_t __ret; 69266 __ret = __p0 + vmovl_s16(__p1); 69267 return __ret; 69268 } 69269 #else 69270 __ai __attribute__((target("neon"))) int32x4_t 
vaddw_s16(int32x4_t __p0, int16x4_t __p1) { 69271 int32x4_t __ret; 69272 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69273 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69274 __ret = __rev0 + __noswap_vmovl_s16(__rev1); 69275 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69276 return __ret; 69277 } 69278 #endif 69279 69280 #ifdef __LITTLE_ENDIAN__ 69281 #define vget_lane_f16(__p0_831, __p1_831) __extension__ ({ \ 69282 float16_t __ret_831; \ 69283 float16x4_t __s0_831 = __p0_831; \ 69284 __ret_831 = __builtin_bit_cast(float16_t, vget_lane_s16(__builtin_bit_cast(int16x4_t, __s0_831), __p1_831)); \ 69285 __ret_831; \ 69286 }) 69287 #else 69288 #define vget_lane_f16(__p0_832, __p1_832) __extension__ ({ \ 69289 float16_t __ret_832; \ 69290 float16x4_t __s0_832 = __p0_832; \ 69291 float16x4_t __rev0_832; __rev0_832 = __builtin_shufflevector(__s0_832, __s0_832, 3, 2, 1, 0); \ 69292 __ret_832 = __builtin_bit_cast(float16_t, __noswap_vget_lane_s16(__builtin_bit_cast(int16x4_t, __rev0_832), __p1_832)); \ 69293 __ret_832; \ 69294 }) 69295 #define __noswap_vget_lane_f16(__p0_833, __p1_833) __extension__ ({ \ 69296 float16_t __ret_833; \ 69297 float16x4_t __s0_833 = __p0_833; \ 69298 __ret_833 = __builtin_bit_cast(float16_t, __noswap_vget_lane_s16(__builtin_bit_cast(int16x4_t, __s0_833), __p1_833)); \ 69299 __ret_833; \ 69300 }) 69301 #endif 69302 69303 #ifdef __LITTLE_ENDIAN__ 69304 #define vgetq_lane_f16(__p0_834, __p1_834) __extension__ ({ \ 69305 float16_t __ret_834; \ 69306 float16x8_t __s0_834 = __p0_834; \ 69307 __ret_834 = __builtin_bit_cast(float16_t, vgetq_lane_s16(__builtin_bit_cast(int16x8_t, __s0_834), __p1_834)); \ 69308 __ret_834; \ 69309 }) 69310 #else 69311 #define vgetq_lane_f16(__p0_835, __p1_835) __extension__ ({ \ 69312 float16_t __ret_835; \ 69313 float16x8_t __s0_835 = __p0_835; \ 69314 float16x8_t __rev0_835; __rev0_835 = __builtin_shufflevector(__s0_835, __s0_835, 7, 6, 5, 4, 3, 
/*
 * vmlal_{u8,u32,u16,s8,s32,s16}: multiply-accumulate "long" wrappers.
 * Each one returns __p0 + vmull_<t>(__p1, __p2), where __p0 has the wide
 * return type and __p1/__p2 are the narrower vector arguments.
 * In the #else (non-little-endian) branch all three inputs are lane-reversed
 * with __builtin_shufflevector, __noswap_vmull_<t> is used, and the result is
 * lane-reversed again; a __noswap_vmlal_<t> variant that performs no shuffles
 * is defined alongside.
 * NOTE(review): this text starts inside the #else vgetq_lane_f16 macro (its
 * remainder and __noswap_vgetq_lane_f16 come first) and ends on the
 * "#else ... __ai" that opens the non-little-endian vmlal_s16.  The bare
 * five-digit numbers look like viewer line numbers fused into the text --
 * confirm against a clean copy of the header.
 */
2, 1, 0); \ 69315 __ret_835 = __builtin_bit_cast(float16_t, __noswap_vgetq_lane_s16(__builtin_bit_cast(int16x8_t, __rev0_835), __p1_835)); \ 69316 __ret_835; \ 69317 }) 69318 #define __noswap_vgetq_lane_f16(__p0_836, __p1_836) __extension__ ({ \ 69319 float16_t __ret_836; \ 69320 float16x8_t __s0_836 = __p0_836; \ 69321 __ret_836 = __builtin_bit_cast(float16_t, __noswap_vgetq_lane_s16(__builtin_bit_cast(int16x8_t, __s0_836), __p1_836)); \ 69322 __ret_836; \ 69323 }) 69324 #endif 69325 69326 #ifdef __LITTLE_ENDIAN__ 69327 __ai __attribute__((target("neon"))) uint16x8_t vmlal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 69328 uint16x8_t __ret; 69329 __ret = __p0 + vmull_u8(__p1, __p2); 69330 return __ret; 69331 } 69332 #else 69333 __ai __attribute__((target("neon"))) uint16x8_t vmlal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 69334 uint16x8_t __ret; 69335 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 69336 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69337 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 69338 __ret = __rev0 + __noswap_vmull_u8(__rev1, __rev2); 69339 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69340 return __ret; 69341 } 69342 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmlal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 69343 uint16x8_t __ret; 69344 __ret = __p0 + __noswap_vmull_u8(__p1, __p2); 69345 return __ret; 69346 } 69347 #endif 69348 69349 #ifdef __LITTLE_ENDIAN__ 69350 __ai __attribute__((target("neon"))) uint64x2_t vmlal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 69351 uint64x2_t __ret; 69352 __ret = __p0 + vmull_u32(__p1, __p2); 69353 return __ret; 69354 } 69355 #else 69356 __ai __attribute__((target("neon"))) uint64x2_t vmlal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 69357 uint64x2_t __ret; 69358 uint64x2_t __rev0; 
__rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69359 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69360 uint32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 69361 __ret = __rev0 + __noswap_vmull_u32(__rev1, __rev2); 69362 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69363 return __ret; 69364 } 69365 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmlal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 69366 uint64x2_t __ret; 69367 __ret = __p0 + __noswap_vmull_u32(__p1, __p2); 69368 return __ret; 69369 } 69370 #endif 69371 69372 #ifdef __LITTLE_ENDIAN__ 69373 __ai __attribute__((target("neon"))) uint32x4_t vmlal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 69374 uint32x4_t __ret; 69375 __ret = __p0 + vmull_u16(__p1, __p2); 69376 return __ret; 69377 } 69378 #else 69379 __ai __attribute__((target("neon"))) uint32x4_t vmlal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 69380 uint32x4_t __ret; 69381 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69382 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69383 uint16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 69384 __ret = __rev0 + __noswap_vmull_u16(__rev1, __rev2); 69385 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69386 return __ret; 69387 } 69388 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmlal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 69389 uint32x4_t __ret; 69390 __ret = __p0 + __noswap_vmull_u16(__p1, __p2); 69391 return __ret; 69392 } 69393 #endif 69394 69395 #ifdef __LITTLE_ENDIAN__ 69396 __ai __attribute__((target("neon"))) int16x8_t vmlal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 69397 int16x8_t __ret; 69398 __ret = __p0 + vmull_s8(__p1, __p2); 69399 return __ret; 69400 } 69401 #else 69402 __ai __attribute__((target("neon"))) int16x8_t vmlal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t 
__p2) { 69403 int16x8_t __ret; 69404 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 69405 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69406 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 69407 __ret = __rev0 + __noswap_vmull_s8(__rev1, __rev2); 69408 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69409 return __ret; 69410 } 69411 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmlal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 69412 int16x8_t __ret; 69413 __ret = __p0 + __noswap_vmull_s8(__p1, __p2); 69414 return __ret; 69415 } 69416 #endif 69417 69418 #ifdef __LITTLE_ENDIAN__ 69419 __ai __attribute__((target("neon"))) int64x2_t vmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 69420 int64x2_t __ret; 69421 __ret = __p0 + vmull_s32(__p1, __p2); 69422 return __ret; 69423 } 69424 #else 69425 __ai __attribute__((target("neon"))) int64x2_t vmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 69426 int64x2_t __ret; 69427 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69428 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69429 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 69430 __ret = __rev0 + __noswap_vmull_s32(__rev1, __rev2); 69431 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69432 return __ret; 69433 } 69434 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmlal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 69435 int64x2_t __ret; 69436 __ret = __p0 + __noswap_vmull_s32(__p1, __p2); 69437 return __ret; 69438 } 69439 #endif 69440 69441 #ifdef __LITTLE_ENDIAN__ 69442 __ai __attribute__((target("neon"))) int32x4_t vmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 69443 int32x4_t __ret; 69444 __ret = __p0 + vmull_s16(__p1, __p2); 69445 return __ret; 69446 } 69447 #else 69448 __ai 
/*
 * vmlal_lane_{u32,u16,s32,s16}: statement-expression macros taking
 * (accumulator, vector, vector, lane).  The three vector arguments are copied
 * into typed locals and the macro yields
 *     acc + vmull_<t>(a, splat_lane_<t>(b, lane)).
 * In the #else (non-little-endian) branch the three locals are lane-reversed
 * with __builtin_shufflevector, the __noswap_vmull_<t> and
 * __noswap_splat_lane_<t> helpers are used, and the result is lane-reversed
 * again.  Every macro definition uses its own numeric suffix on parameters and
 * locals (_837, _838, ...); presumably this keeps nested expansions from
 * shadowing one another -- confirm against the generator.
 * NOTE(review): this text starts with the non-little-endian vmlal_s16 (whose
 * leading "__ai" sits on the previous line) and ends inside the #else body of
 * vmlal_n_u32.  The bare five-digit numbers look like viewer line numbers fused
 * into the text -- confirm against a clean copy of the header.
 */
__attribute__((target("neon"))) int32x4_t vmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 69449 int32x4_t __ret; 69450 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69451 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69452 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 69453 __ret = __rev0 + __noswap_vmull_s16(__rev1, __rev2); 69454 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69455 return __ret; 69456 } 69457 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmlal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 69458 int32x4_t __ret; 69459 __ret = __p0 + __noswap_vmull_s16(__p1, __p2); 69460 return __ret; 69461 } 69462 #endif 69463 69464 #ifdef __LITTLE_ENDIAN__ 69465 #define vmlal_lane_u32(__p0_837, __p1_837, __p2_837, __p3_837) __extension__ ({ \ 69466 uint64x2_t __ret_837; \ 69467 uint64x2_t __s0_837 = __p0_837; \ 69468 uint32x2_t __s1_837 = __p1_837; \ 69469 uint32x2_t __s2_837 = __p2_837; \ 69470 __ret_837 = __s0_837 + vmull_u32(__s1_837, splat_lane_u32(__s2_837, __p3_837)); \ 69471 __ret_837; \ 69472 }) 69473 #else 69474 #define vmlal_lane_u32(__p0_838, __p1_838, __p2_838, __p3_838) __extension__ ({ \ 69475 uint64x2_t __ret_838; \ 69476 uint64x2_t __s0_838 = __p0_838; \ 69477 uint32x2_t __s1_838 = __p1_838; \ 69478 uint32x2_t __s2_838 = __p2_838; \ 69479 uint64x2_t __rev0_838; __rev0_838 = __builtin_shufflevector(__s0_838, __s0_838, 1, 0); \ 69480 uint32x2_t __rev1_838; __rev1_838 = __builtin_shufflevector(__s1_838, __s1_838, 1, 0); \ 69481 uint32x2_t __rev2_838; __rev2_838 = __builtin_shufflevector(__s2_838, __s2_838, 1, 0); \ 69482 __ret_838 = __rev0_838 + __noswap_vmull_u32(__rev1_838, __noswap_splat_lane_u32(__rev2_838, __p3_838)); \ 69483 __ret_838 = __builtin_shufflevector(__ret_838, __ret_838, 1, 0); \ 69484 __ret_838; \ 69485 }) 69486 #endif 69487 69488 #ifdef __LITTLE_ENDIAN__ 69489 #define vmlal_lane_u16(__p0_839, __p1_839, 
__p2_839, __p3_839) __extension__ ({ \ 69490 uint32x4_t __ret_839; \ 69491 uint32x4_t __s0_839 = __p0_839; \ 69492 uint16x4_t __s1_839 = __p1_839; \ 69493 uint16x4_t __s2_839 = __p2_839; \ 69494 __ret_839 = __s0_839 + vmull_u16(__s1_839, splat_lane_u16(__s2_839, __p3_839)); \ 69495 __ret_839; \ 69496 }) 69497 #else 69498 #define vmlal_lane_u16(__p0_840, __p1_840, __p2_840, __p3_840) __extension__ ({ \ 69499 uint32x4_t __ret_840; \ 69500 uint32x4_t __s0_840 = __p0_840; \ 69501 uint16x4_t __s1_840 = __p1_840; \ 69502 uint16x4_t __s2_840 = __p2_840; \ 69503 uint32x4_t __rev0_840; __rev0_840 = __builtin_shufflevector(__s0_840, __s0_840, 3, 2, 1, 0); \ 69504 uint16x4_t __rev1_840; __rev1_840 = __builtin_shufflevector(__s1_840, __s1_840, 3, 2, 1, 0); \ 69505 uint16x4_t __rev2_840; __rev2_840 = __builtin_shufflevector(__s2_840, __s2_840, 3, 2, 1, 0); \ 69506 __ret_840 = __rev0_840 + __noswap_vmull_u16(__rev1_840, __noswap_splat_lane_u16(__rev2_840, __p3_840)); \ 69507 __ret_840 = __builtin_shufflevector(__ret_840, __ret_840, 3, 2, 1, 0); \ 69508 __ret_840; \ 69509 }) 69510 #endif 69511 69512 #ifdef __LITTLE_ENDIAN__ 69513 #define vmlal_lane_s32(__p0_841, __p1_841, __p2_841, __p3_841) __extension__ ({ \ 69514 int64x2_t __ret_841; \ 69515 int64x2_t __s0_841 = __p0_841; \ 69516 int32x2_t __s1_841 = __p1_841; \ 69517 int32x2_t __s2_841 = __p2_841; \ 69518 __ret_841 = __s0_841 + vmull_s32(__s1_841, splat_lane_s32(__s2_841, __p3_841)); \ 69519 __ret_841; \ 69520 }) 69521 #else 69522 #define vmlal_lane_s32(__p0_842, __p1_842, __p2_842, __p3_842) __extension__ ({ \ 69523 int64x2_t __ret_842; \ 69524 int64x2_t __s0_842 = __p0_842; \ 69525 int32x2_t __s1_842 = __p1_842; \ 69526 int32x2_t __s2_842 = __p2_842; \ 69527 int64x2_t __rev0_842; __rev0_842 = __builtin_shufflevector(__s0_842, __s0_842, 1, 0); \ 69528 int32x2_t __rev1_842; __rev1_842 = __builtin_shufflevector(__s1_842, __s1_842, 1, 0); \ 69529 int32x2_t __rev2_842; __rev2_842 = __builtin_shufflevector(__s2_842, __s2_842, 1, 
0); \ 69530 __ret_842 = __rev0_842 + __noswap_vmull_s32(__rev1_842, __noswap_splat_lane_s32(__rev2_842, __p3_842)); \ 69531 __ret_842 = __builtin_shufflevector(__ret_842, __ret_842, 1, 0); \ 69532 __ret_842; \ 69533 }) 69534 #endif 69535 69536 #ifdef __LITTLE_ENDIAN__ 69537 #define vmlal_lane_s16(__p0_843, __p1_843, __p2_843, __p3_843) __extension__ ({ \ 69538 int32x4_t __ret_843; \ 69539 int32x4_t __s0_843 = __p0_843; \ 69540 int16x4_t __s1_843 = __p1_843; \ 69541 int16x4_t __s2_843 = __p2_843; \ 69542 __ret_843 = __s0_843 + vmull_s16(__s1_843, splat_lane_s16(__s2_843, __p3_843)); \ 69543 __ret_843; \ 69544 }) 69545 #else 69546 #define vmlal_lane_s16(__p0_844, __p1_844, __p2_844, __p3_844) __extension__ ({ \ 69547 int32x4_t __ret_844; \ 69548 int32x4_t __s0_844 = __p0_844; \ 69549 int16x4_t __s1_844 = __p1_844; \ 69550 int16x4_t __s2_844 = __p2_844; \ 69551 int32x4_t __rev0_844; __rev0_844 = __builtin_shufflevector(__s0_844, __s0_844, 3, 2, 1, 0); \ 69552 int16x4_t __rev1_844; __rev1_844 = __builtin_shufflevector(__s1_844, __s1_844, 3, 2, 1, 0); \ 69553 int16x4_t __rev2_844; __rev2_844 = __builtin_shufflevector(__s2_844, __s2_844, 3, 2, 1, 0); \ 69554 __ret_844 = __rev0_844 + __noswap_vmull_s16(__rev1_844, __noswap_splat_lane_s16(__rev2_844, __p3_844)); \ 69555 __ret_844 = __builtin_shufflevector(__ret_844, __ret_844, 3, 2, 1, 0); \ 69556 __ret_844; \ 69557 }) 69558 #endif 69559 69560 #ifdef __LITTLE_ENDIAN__ 69561 __ai __attribute__((target("neon"))) uint64x2_t vmlal_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 69562 uint64x2_t __ret; 69563 __ret = __p0 + vmull_u32(__p1, (uint32x2_t) {__p2, __p2}); 69564 return __ret; 69565 } 69566 #else 69567 __ai __attribute__((target("neon"))) uint64x2_t vmlal_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 69568 uint64x2_t __ret; 69569 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69570 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69571 __ret = __rev0 + 
/*
 * vmlal_n_{u32,u16,s32,s16}: multiply-accumulate "long" by a scalar.
 * Each one returns __p0 + vmull_<t>(__p1, v), where v is a vector literal with
 * the scalar __p2 repeated in every lane (two lanes for the 32-bit forms, four
 * for the 16-bit forms).
 * In the #else (non-little-endian) branch __p0 and __p1 are lane-reversed with
 * __builtin_shufflevector, __noswap_vmull_<t> is used, and the result is
 * lane-reversed again; the all-lanes-equal literal is passed as is.  A
 * __noswap_vmlal_n_<t> variant that performs no shuffles is defined alongside.
 * NOTE(review): this text starts inside the #else body of vmlal_n_u32 and ends
 * inside the #else body of vmlsl_u8 (the subtracting counterpart, which uses
 * __p0 - vmull_u8(__p1, __p2)).  The bare five-digit numbers look like viewer
 * line numbers fused into the text -- confirm against a clean copy.
 */
__noswap_vmull_u32(__rev1, (uint32x2_t) {__p2, __p2}); 69572 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69573 return __ret; 69574 } 69575 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmlal_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 69576 uint64x2_t __ret; 69577 __ret = __p0 + __noswap_vmull_u32(__p1, (uint32x2_t) {__p2, __p2}); 69578 return __ret; 69579 } 69580 #endif 69581 69582 #ifdef __LITTLE_ENDIAN__ 69583 __ai __attribute__((target("neon"))) uint32x4_t vmlal_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 69584 uint32x4_t __ret; 69585 __ret = __p0 + vmull_u16(__p1, (uint16x4_t) {__p2, __p2, __p2, __p2}); 69586 return __ret; 69587 } 69588 #else 69589 __ai __attribute__((target("neon"))) uint32x4_t vmlal_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 69590 uint32x4_t __ret; 69591 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69592 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69593 __ret = __rev0 + __noswap_vmull_u16(__rev1, (uint16x4_t) {__p2, __p2, __p2, __p2}); 69594 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69595 return __ret; 69596 } 69597 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmlal_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 69598 uint32x4_t __ret; 69599 __ret = __p0 + __noswap_vmull_u16(__p1, (uint16x4_t) {__p2, __p2, __p2, __p2}); 69600 return __ret; 69601 } 69602 #endif 69603 69604 #ifdef __LITTLE_ENDIAN__ 69605 __ai __attribute__((target("neon"))) int64x2_t vmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 69606 int64x2_t __ret; 69607 __ret = __p0 + vmull_s32(__p1, (int32x2_t) {__p2, __p2}); 69608 return __ret; 69609 } 69610 #else 69611 __ai __attribute__((target("neon"))) int64x2_t vmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 69612 int64x2_t __ret; 69613 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69614 int32x2_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 1, 0); 69615 __ret = __rev0 + __noswap_vmull_s32(__rev1, (int32x2_t) {__p2, __p2}); 69616 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69617 return __ret; 69618 } 69619 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmlal_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 69620 int64x2_t __ret; 69621 __ret = __p0 + __noswap_vmull_s32(__p1, (int32x2_t) {__p2, __p2}); 69622 return __ret; 69623 } 69624 #endif 69625 69626 #ifdef __LITTLE_ENDIAN__ 69627 __ai __attribute__((target("neon"))) int32x4_t vmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 69628 int32x4_t __ret; 69629 __ret = __p0 + vmull_s16(__p1, (int16x4_t) {__p2, __p2, __p2, __p2}); 69630 return __ret; 69631 } 69632 #else 69633 __ai __attribute__((target("neon"))) int32x4_t vmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 69634 int32x4_t __ret; 69635 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69636 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69637 __ret = __rev0 + __noswap_vmull_s16(__rev1, (int16x4_t) {__p2, __p2, __p2, __p2}); 69638 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69639 return __ret; 69640 } 69641 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmlal_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 69642 int32x4_t __ret; 69643 __ret = __p0 + __noswap_vmull_s16(__p1, (int16x4_t) {__p2, __p2, __p2, __p2}); 69644 return __ret; 69645 } 69646 #endif 69647 69648 #ifdef __LITTLE_ENDIAN__ 69649 __ai __attribute__((target("neon"))) uint16x8_t vmlsl_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 69650 uint16x8_t __ret; 69651 __ret = __p0 - vmull_u8(__p1, __p2); 69652 return __ret; 69653 } 69654 #else 69655 __ai __attribute__((target("neon"))) uint16x8_t vmlsl_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 69656 uint16x8_t __ret; 69657 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 
/*
 * vmlsl_{u8,u32,u16,s8,s32,s16}: multiply-subtract "long" wrappers.
 * Each one returns __p0 - vmull_<t>(__p1, __p2), where __p0 has the wide
 * return type and __p1/__p2 are the narrower vector arguments.
 * In the #else (non-little-endian) branch all three inputs are lane-reversed
 * with __builtin_shufflevector, __noswap_vmull_<t> is used, and the result is
 * lane-reversed again; a __noswap_vmlsl_<t> variant that performs no shuffles
 * is defined alongside.
 * NOTE(review): this text starts inside the #else body of vmlsl_u8 and ends
 * inside the little-endian vmlsl_lane_u32 macro.  The bare five-digit numbers
 * look like viewer line numbers fused into the text -- confirm against a clean
 * copy of the header.
 */
69658 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69659 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 69660 __ret = __rev0 - __noswap_vmull_u8(__rev1, __rev2); 69661 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69662 return __ret; 69663 } 69664 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vmlsl_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 69665 uint16x8_t __ret; 69666 __ret = __p0 - __noswap_vmull_u8(__p1, __p2); 69667 return __ret; 69668 } 69669 #endif 69670 69671 #ifdef __LITTLE_ENDIAN__ 69672 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 69673 uint64x2_t __ret; 69674 __ret = __p0 - vmull_u32(__p1, __p2); 69675 return __ret; 69676 } 69677 #else 69678 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 69679 uint64x2_t __ret; 69680 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69681 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69682 uint32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 69683 __ret = __rev0 - __noswap_vmull_u32(__rev1, __rev2); 69684 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69685 return __ret; 69686 } 69687 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmlsl_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 69688 uint64x2_t __ret; 69689 __ret = __p0 - __noswap_vmull_u32(__p1, __p2); 69690 return __ret; 69691 } 69692 #endif 69693 69694 #ifdef __LITTLE_ENDIAN__ 69695 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 69696 uint32x4_t __ret; 69697 __ret = __p0 - vmull_u16(__p1, __p2); 69698 return __ret; 69699 } 69700 #else 69701 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 69702 
uint32x4_t __ret; 69703 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69704 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69705 uint16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 69706 __ret = __rev0 - __noswap_vmull_u16(__rev1, __rev2); 69707 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69708 return __ret; 69709 } 69710 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmlsl_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 69711 uint32x4_t __ret; 69712 __ret = __p0 - __noswap_vmull_u16(__p1, __p2); 69713 return __ret; 69714 } 69715 #endif 69716 69717 #ifdef __LITTLE_ENDIAN__ 69718 __ai __attribute__((target("neon"))) int16x8_t vmlsl_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 69719 int16x8_t __ret; 69720 __ret = __p0 - vmull_s8(__p1, __p2); 69721 return __ret; 69722 } 69723 #else 69724 __ai __attribute__((target("neon"))) int16x8_t vmlsl_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 69725 int16x8_t __ret; 69726 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 69727 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 69728 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 69729 __ret = __rev0 - __noswap_vmull_s8(__rev1, __rev2); 69730 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 69731 return __ret; 69732 } 69733 __ai __attribute__((target("neon"))) int16x8_t __noswap_vmlsl_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 69734 int16x8_t __ret; 69735 __ret = __p0 - __noswap_vmull_s8(__p1, __p2); 69736 return __ret; 69737 } 69738 #endif 69739 69740 #ifdef __LITTLE_ENDIAN__ 69741 __ai __attribute__((target("neon"))) int64x2_t vmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 69742 int64x2_t __ret; 69743 __ret = __p0 - vmull_s32(__p1, __p2); 69744 return __ret; 69745 } 69746 #else 69747 __ai 
__attribute__((target("neon"))) int64x2_t vmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 69748 int64x2_t __ret; 69749 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69750 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69751 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 69752 __ret = __rev0 - __noswap_vmull_s32(__rev1, __rev2); 69753 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69754 return __ret; 69755 } 69756 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmlsl_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 69757 int64x2_t __ret; 69758 __ret = __p0 - __noswap_vmull_s32(__p1, __p2); 69759 return __ret; 69760 } 69761 #endif 69762 69763 #ifdef __LITTLE_ENDIAN__ 69764 __ai __attribute__((target("neon"))) int32x4_t vmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 69765 int32x4_t __ret; 69766 __ret = __p0 - vmull_s16(__p1, __p2); 69767 return __ret; 69768 } 69769 #else 69770 __ai __attribute__((target("neon"))) int32x4_t vmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 69771 int32x4_t __ret; 69772 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69773 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69774 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 69775 __ret = __rev0 - __noswap_vmull_s16(__rev1, __rev2); 69776 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69777 return __ret; 69778 } 69779 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmlsl_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 69780 int32x4_t __ret; 69781 __ret = __p0 - __noswap_vmull_s16(__p1, __p2); 69782 return __ret; 69783 } 69784 #endif 69785 69786 #ifdef __LITTLE_ENDIAN__ 69787 #define vmlsl_lane_u32(__p0_845, __p1_845, __p2_845, __p3_845) __extension__ ({ \ 69788 uint64x2_t __ret_845; \ 69789 uint64x2_t __s0_845 = __p0_845; \ 69790 uint32x2_t __s1_845 = 
__p1_845; \ 69791 uint32x2_t __s2_845 = __p2_845; \ 69792 __ret_845 = __s0_845 - vmull_u32(__s1_845, splat_lane_u32(__s2_845, __p3_845)); \ 69793 __ret_845; \ 69794 }) 69795 #else 69796 #define vmlsl_lane_u32(__p0_846, __p1_846, __p2_846, __p3_846) __extension__ ({ \ 69797 uint64x2_t __ret_846; \ 69798 uint64x2_t __s0_846 = __p0_846; \ 69799 uint32x2_t __s1_846 = __p1_846; \ 69800 uint32x2_t __s2_846 = __p2_846; \ 69801 uint64x2_t __rev0_846; __rev0_846 = __builtin_shufflevector(__s0_846, __s0_846, 1, 0); \ 69802 uint32x2_t __rev1_846; __rev1_846 = __builtin_shufflevector(__s1_846, __s1_846, 1, 0); \ 69803 uint32x2_t __rev2_846; __rev2_846 = __builtin_shufflevector(__s2_846, __s2_846, 1, 0); \ 69804 __ret_846 = __rev0_846 - __noswap_vmull_u32(__rev1_846, __noswap_splat_lane_u32(__rev2_846, __p3_846)); \ 69805 __ret_846 = __builtin_shufflevector(__ret_846, __ret_846, 1, 0); \ 69806 __ret_846; \ 69807 }) 69808 #endif 69809 69810 #ifdef __LITTLE_ENDIAN__ 69811 #define vmlsl_lane_u16(__p0_847, __p1_847, __p2_847, __p3_847) __extension__ ({ \ 69812 uint32x4_t __ret_847; \ 69813 uint32x4_t __s0_847 = __p0_847; \ 69814 uint16x4_t __s1_847 = __p1_847; \ 69815 uint16x4_t __s2_847 = __p2_847; \ 69816 __ret_847 = __s0_847 - vmull_u16(__s1_847, splat_lane_u16(__s2_847, __p3_847)); \ 69817 __ret_847; \ 69818 }) 69819 #else 69820 #define vmlsl_lane_u16(__p0_848, __p1_848, __p2_848, __p3_848) __extension__ ({ \ 69821 uint32x4_t __ret_848; \ 69822 uint32x4_t __s0_848 = __p0_848; \ 69823 uint16x4_t __s1_848 = __p1_848; \ 69824 uint16x4_t __s2_848 = __p2_848; \ 69825 uint32x4_t __rev0_848; __rev0_848 = __builtin_shufflevector(__s0_848, __s0_848, 3, 2, 1, 0); \ 69826 uint16x4_t __rev1_848; __rev1_848 = __builtin_shufflevector(__s1_848, __s1_848, 3, 2, 1, 0); \ 69827 uint16x4_t __rev2_848; __rev2_848 = __builtin_shufflevector(__s2_848, __s2_848, 3, 2, 1, 0); \ 69828 __ret_848 = __rev0_848 - __noswap_vmull_u16(__rev1_848, __noswap_splat_lane_u16(__rev2_848, __p3_848)); \ 69829 
__ret_848 = __builtin_shufflevector(__ret_848, __ret_848, 3, 2, 1, 0); \ 69830 __ret_848; \ 69831 }) 69832 #endif 69833 69834 #ifdef __LITTLE_ENDIAN__ 69835 #define vmlsl_lane_s32(__p0_849, __p1_849, __p2_849, __p3_849) __extension__ ({ \ 69836 int64x2_t __ret_849; \ 69837 int64x2_t __s0_849 = __p0_849; \ 69838 int32x2_t __s1_849 = __p1_849; \ 69839 int32x2_t __s2_849 = __p2_849; \ 69840 __ret_849 = __s0_849 - vmull_s32(__s1_849, splat_lane_s32(__s2_849, __p3_849)); \ 69841 __ret_849; \ 69842 }) 69843 #else 69844 #define vmlsl_lane_s32(__p0_850, __p1_850, __p2_850, __p3_850) __extension__ ({ \ 69845 int64x2_t __ret_850; \ 69846 int64x2_t __s0_850 = __p0_850; \ 69847 int32x2_t __s1_850 = __p1_850; \ 69848 int32x2_t __s2_850 = __p2_850; \ 69849 int64x2_t __rev0_850; __rev0_850 = __builtin_shufflevector(__s0_850, __s0_850, 1, 0); \ 69850 int32x2_t __rev1_850; __rev1_850 = __builtin_shufflevector(__s1_850, __s1_850, 1, 0); \ 69851 int32x2_t __rev2_850; __rev2_850 = __builtin_shufflevector(__s2_850, __s2_850, 1, 0); \ 69852 __ret_850 = __rev0_850 - __noswap_vmull_s32(__rev1_850, __noswap_splat_lane_s32(__rev2_850, __p3_850)); \ 69853 __ret_850 = __builtin_shufflevector(__ret_850, __ret_850, 1, 0); \ 69854 __ret_850; \ 69855 }) 69856 #endif 69857 69858 #ifdef __LITTLE_ENDIAN__ 69859 #define vmlsl_lane_s16(__p0_851, __p1_851, __p2_851, __p3_851) __extension__ ({ \ 69860 int32x4_t __ret_851; \ 69861 int32x4_t __s0_851 = __p0_851; \ 69862 int16x4_t __s1_851 = __p1_851; \ 69863 int16x4_t __s2_851 = __p2_851; \ 69864 __ret_851 = __s0_851 - vmull_s16(__s1_851, splat_lane_s16(__s2_851, __p3_851)); \ 69865 __ret_851; \ 69866 }) 69867 #else 69868 #define vmlsl_lane_s16(__p0_852, __p1_852, __p2_852, __p3_852) __extension__ ({ \ 69869 int32x4_t __ret_852; \ 69870 int32x4_t __s0_852 = __p0_852; \ 69871 int16x4_t __s1_852 = __p1_852; \ 69872 int16x4_t __s2_852 = __p2_852; \ 69873 int32x4_t __rev0_852; __rev0_852 = __builtin_shufflevector(__s0_852, __s0_852, 3, 2, 1, 0); \ 69874 
int16x4_t __rev1_852; __rev1_852 = __builtin_shufflevector(__s1_852, __s1_852, 3, 2, 1, 0); \ 69875 int16x4_t __rev2_852; __rev2_852 = __builtin_shufflevector(__s2_852, __s2_852, 3, 2, 1, 0); \ 69876 __ret_852 = __rev0_852 - __noswap_vmull_s16(__rev1_852, __noswap_splat_lane_s16(__rev2_852, __p3_852)); \ 69877 __ret_852 = __builtin_shufflevector(__ret_852, __ret_852, 3, 2, 1, 0); \ 69878 __ret_852; \ 69879 }) 69880 #endif 69881 69882 #ifdef __LITTLE_ENDIAN__ 69883 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 69884 uint64x2_t __ret; 69885 __ret = __p0 - vmull_u32(__p1, (uint32x2_t) {__p2, __p2}); 69886 return __ret; 69887 } 69888 #else 69889 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 69890 uint64x2_t __ret; 69891 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69892 uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69893 __ret = __rev0 - __noswap_vmull_u32(__rev1, (uint32x2_t) {__p2, __p2}); 69894 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69895 return __ret; 69896 } 69897 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vmlsl_n_u32(uint64x2_t __p0, uint32x2_t __p1, uint32_t __p2) { 69898 uint64x2_t __ret; 69899 __ret = __p0 - __noswap_vmull_u32(__p1, (uint32x2_t) {__p2, __p2}); 69900 return __ret; 69901 } 69902 #endif 69903 69904 #ifdef __LITTLE_ENDIAN__ 69905 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 69906 uint32x4_t __ret; 69907 __ret = __p0 - vmull_u16(__p1, (uint16x4_t) {__p2, __p2, __p2, __p2}); 69908 return __ret; 69909 } 69910 #else 69911 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 69912 uint32x4_t __ret; 69913 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 69914 uint16x4_t __rev1; __rev1 = 
__builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69915 __ret = __rev0 - __noswap_vmull_u16(__rev1, (uint16x4_t) {__p2, __p2, __p2, __p2}); 69916 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69917 return __ret; 69918 } 69919 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vmlsl_n_u16(uint32x4_t __p0, uint16x4_t __p1, uint16_t __p2) { 69920 uint32x4_t __ret; 69921 __ret = __p0 - __noswap_vmull_u16(__p1, (uint16x4_t) {__p2, __p2, __p2, __p2}); 69922 return __ret; 69923 } 69924 #endif 69925 69926 #ifdef __LITTLE_ENDIAN__ 69927 __ai __attribute__((target("neon"))) int64x2_t vmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 69928 int64x2_t __ret; 69929 __ret = __p0 - vmull_s32(__p1, (int32x2_t) {__p2, __p2}); 69930 return __ret; 69931 } 69932 #else 69933 __ai __attribute__((target("neon"))) int64x2_t vmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 69934 int64x2_t __ret; 69935 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 69936 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 69937 __ret = __rev0 - __noswap_vmull_s32(__rev1, (int32x2_t) {__p2, __p2}); 69938 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 69939 return __ret; 69940 } 69941 __ai __attribute__((target("neon"))) int64x2_t __noswap_vmlsl_n_s32(int64x2_t __p0, int32x2_t __p1, int32_t __p2) { 69942 int64x2_t __ret; 69943 __ret = __p0 - __noswap_vmull_s32(__p1, (int32x2_t) {__p2, __p2}); 69944 return __ret; 69945 } 69946 #endif 69947 69948 #ifdef __LITTLE_ENDIAN__ 69949 __ai __attribute__((target("neon"))) int32x4_t vmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 69950 int32x4_t __ret; 69951 __ret = __p0 - vmull_s16(__p1, (int16x4_t) {__p2, __p2, __p2, __p2}); 69952 return __ret; 69953 } 69954 #else 69955 __ai __attribute__((target("neon"))) int32x4_t vmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 69956 int32x4_t __ret; 69957 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 
0); 69958 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 69959 __ret = __rev0 - __noswap_vmull_s16(__rev1, (int16x4_t) {__p2, __p2, __p2, __p2}); 69960 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 69961 return __ret; 69962 } 69963 __ai __attribute__((target("neon"))) int32x4_t __noswap_vmlsl_n_s16(int32x4_t __p0, int16x4_t __p1, int16_t __p2) { 69964 int32x4_t __ret; 69965 __ret = __p0 - __noswap_vmull_s16(__p1, (int16x4_t) {__p2, __p2, __p2, __p2}); 69966 return __ret; 69967 } 69968 #endif 69969 69970 #ifdef __LITTLE_ENDIAN__ 69971 #define vset_lane_f16(__p0_853, __p1_853, __p2_853) __extension__ ({ \ 69972 float16x4_t __ret_853; \ 69973 float16_t __s0_853 = __p0_853; \ 69974 float16x4_t __s1_853 = __p1_853; \ 69975 __ret_853 = __builtin_bit_cast(float16x4_t, vset_lane_s16(__builtin_bit_cast(int16_t, __s0_853), __builtin_bit_cast(int16x4_t, __s1_853), __p2_853)); \ 69976 __ret_853; \ 69977 }) 69978 #else 69979 #define vset_lane_f16(__p0_854, __p1_854, __p2_854) __extension__ ({ \ 69980 float16x4_t __ret_854; \ 69981 float16_t __s0_854 = __p0_854; \ 69982 float16x4_t __s1_854 = __p1_854; \ 69983 float16x4_t __rev1_854; __rev1_854 = __builtin_shufflevector(__s1_854, __s1_854, 3, 2, 1, 0); \ 69984 __ret_854 = __builtin_bit_cast(float16x4_t, __noswap_vset_lane_s16(__builtin_bit_cast(int16_t, __s0_854), __builtin_bit_cast(int16x4_t, __rev1_854), __p2_854)); \ 69985 __ret_854 = __builtin_shufflevector(__ret_854, __ret_854, 3, 2, 1, 0); \ 69986 __ret_854; \ 69987 }) 69988 #endif 69989 69990 #ifdef __LITTLE_ENDIAN__ 69991 #define vsetq_lane_f16(__p0_855, __p1_855, __p2_855) __extension__ ({ \ 69992 float16x8_t __ret_855; \ 69993 float16_t __s0_855 = __p0_855; \ 69994 float16x8_t __s1_855 = __p1_855; \ 69995 __ret_855 = __builtin_bit_cast(float16x8_t, vsetq_lane_s16(__builtin_bit_cast(int16_t, __s0_855), __builtin_bit_cast(int16x8_t, __s1_855), __p2_855)); \ 69996 __ret_855; \ 69997 }) 69998 #else 69999 #define 
vsetq_lane_f16(__p0_856, __p1_856, __p2_856) __extension__ ({ \ 70000 float16x8_t __ret_856; \ 70001 float16_t __s0_856 = __p0_856; \ 70002 float16x8_t __s1_856 = __p1_856; \ 70003 float16x8_t __rev1_856; __rev1_856 = __builtin_shufflevector(__s1_856, __s1_856, 7, 6, 5, 4, 3, 2, 1, 0); \ 70004 __ret_856 = __builtin_bit_cast(float16x8_t, __noswap_vsetq_lane_s16(__builtin_bit_cast(int16_t, __s0_856), __builtin_bit_cast(int16x8_t, __rev1_856), __p2_856)); \ 70005 __ret_856 = __builtin_shufflevector(__ret_856, __ret_856, 7, 6, 5, 4, 3, 2, 1, 0); \ 70006 __ret_856; \ 70007 }) 70008 #endif 70009 70010 #if defined(__aarch64__) || defined(__arm64ec__) 70011 #ifdef __LITTLE_ENDIAN__ 70012 __ai __attribute__((target("aes,neon"))) poly128_t vmull_high_p64(poly64x2_t __p0, poly64x2_t __p1) { 70013 poly128_t __ret; 70014 __ret = vmull_p64((poly64_t)(vget_high_p64(__p0)), (poly64_t)(vget_high_p64(__p1))); 70015 return __ret; 70016 } 70017 #else 70018 __ai __attribute__((target("aes,neon"))) poly128_t vmull_high_p64(poly64x2_t __p0, poly64x2_t __p1) { 70019 poly128_t __ret; 70020 poly64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 70021 poly64x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 70022 __ret = vmull_p64((poly64_t)(__noswap_vget_high_p64(__rev0)), (poly64_t)(__noswap_vget_high_p64(__rev1))); 70023 return __ret; 70024 } 70025 #endif 70026 70027 #ifdef __LITTLE_ENDIAN__ 70028 #define vfmlalq_lane_high_f16(__p0_857, __p1_857, __p2_857, __p3_857) __extension__ ({ \ 70029 float32x4_t __ret_857; \ 70030 float32x4_t __s0_857 = __p0_857; \ 70031 float16x8_t __s1_857 = __p1_857; \ 70032 float16x4_t __s2_857 = __p2_857; \ 70033 __ret_857 = vfmlalq_high_f16(__s0_857, __s1_857, (float16x8_t) {vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), vget_lane_f16(__s2_857, __p3_857), 
vget_lane_f16(__s2_857, __p3_857)}); \ 70034 __ret_857; \ 70035 }) 70036 #else 70037 #define vfmlalq_lane_high_f16(__p0_858, __p1_858, __p2_858, __p3_858) __extension__ ({ \ 70038 float32x4_t __ret_858; \ 70039 float32x4_t __s0_858 = __p0_858; \ 70040 float16x8_t __s1_858 = __p1_858; \ 70041 float16x4_t __s2_858 = __p2_858; \ 70042 float32x4_t __rev0_858; __rev0_858 = __builtin_shufflevector(__s0_858, __s0_858, 3, 2, 1, 0); \ 70043 float16x8_t __rev1_858; __rev1_858 = __builtin_shufflevector(__s1_858, __s1_858, 7, 6, 5, 4, 3, 2, 1, 0); \ 70044 float16x4_t __rev2_858; __rev2_858 = __builtin_shufflevector(__s2_858, __s2_858, 3, 2, 1, 0); \ 70045 __ret_858 = __noswap_vfmlalq_high_f16(__rev0_858, __rev1_858, (float16x8_t) {__noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858), __noswap_vget_lane_f16(__rev2_858, __p3_858)}); \ 70046 __ret_858 = __builtin_shufflevector(__ret_858, __ret_858, 3, 2, 1, 0); \ 70047 __ret_858; \ 70048 }) 70049 #endif 70050 70051 #ifdef __LITTLE_ENDIAN__ 70052 #define vfmlal_lane_high_f16(__p0_859, __p1_859, __p2_859, __p3_859) __extension__ ({ \ 70053 float32x2_t __ret_859; \ 70054 float32x2_t __s0_859 = __p0_859; \ 70055 float16x4_t __s1_859 = __p1_859; \ 70056 float16x4_t __s2_859 = __p2_859; \ 70057 __ret_859 = vfmlal_high_f16(__s0_859, __s1_859, (float16x4_t) {vget_lane_f16(__s2_859, __p3_859), vget_lane_f16(__s2_859, __p3_859), vget_lane_f16(__s2_859, __p3_859), vget_lane_f16(__s2_859, __p3_859)}); \ 70058 __ret_859; \ 70059 }) 70060 #else 70061 #define vfmlal_lane_high_f16(__p0_860, __p1_860, __p2_860, __p3_860) __extension__ ({ \ 70062 float32x2_t __ret_860; \ 70063 float32x2_t __s0_860 = __p0_860; \ 70064 float16x4_t __s1_860 = __p1_860; \ 70065 float16x4_t __s2_860 = 
__p2_860; \ 70066 float32x2_t __rev0_860; __rev0_860 = __builtin_shufflevector(__s0_860, __s0_860, 1, 0); \ 70067 float16x4_t __rev1_860; __rev1_860 = __builtin_shufflevector(__s1_860, __s1_860, 3, 2, 1, 0); \ 70068 float16x4_t __rev2_860; __rev2_860 = __builtin_shufflevector(__s2_860, __s2_860, 3, 2, 1, 0); \ 70069 __ret_860 = __noswap_vfmlal_high_f16(__rev0_860, __rev1_860, (float16x4_t) {__noswap_vget_lane_f16(__rev2_860, __p3_860), __noswap_vget_lane_f16(__rev2_860, __p3_860), __noswap_vget_lane_f16(__rev2_860, __p3_860), __noswap_vget_lane_f16(__rev2_860, __p3_860)}); \ 70070 __ret_860 = __builtin_shufflevector(__ret_860, __ret_860, 1, 0); \ 70071 __ret_860; \ 70072 }) 70073 #endif 70074 70075 #ifdef __LITTLE_ENDIAN__ 70076 #define vfmlalq_lane_low_f16(__p0_861, __p1_861, __p2_861, __p3_861) __extension__ ({ \ 70077 float32x4_t __ret_861; \ 70078 float32x4_t __s0_861 = __p0_861; \ 70079 float16x8_t __s1_861 = __p1_861; \ 70080 float16x4_t __s2_861 = __p2_861; \ 70081 __ret_861 = vfmlalq_low_f16(__s0_861, __s1_861, (float16x8_t) {vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861), vget_lane_f16(__s2_861, __p3_861)}); \ 70082 __ret_861; \ 70083 }) 70084 #else 70085 #define vfmlalq_lane_low_f16(__p0_862, __p1_862, __p2_862, __p3_862) __extension__ ({ \ 70086 float32x4_t __ret_862; \ 70087 float32x4_t __s0_862 = __p0_862; \ 70088 float16x8_t __s1_862 = __p1_862; \ 70089 float16x4_t __s2_862 = __p2_862; \ 70090 float32x4_t __rev0_862; __rev0_862 = __builtin_shufflevector(__s0_862, __s0_862, 3, 2, 1, 0); \ 70091 float16x8_t __rev1_862; __rev1_862 = __builtin_shufflevector(__s1_862, __s1_862, 7, 6, 5, 4, 3, 2, 1, 0); \ 70092 float16x4_t __rev2_862; __rev2_862 = __builtin_shufflevector(__s2_862, __s2_862, 3, 2, 1, 0); \ 70093 __ret_862 = __noswap_vfmlalq_low_f16(__rev0_862, 
__rev1_862, (float16x8_t) {__noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862), __noswap_vget_lane_f16(__rev2_862, __p3_862)}); \ 70094 __ret_862 = __builtin_shufflevector(__ret_862, __ret_862, 3, 2, 1, 0); \ 70095 __ret_862; \ 70096 }) 70097 #endif 70098 70099 #ifdef __LITTLE_ENDIAN__ 70100 #define vfmlal_lane_low_f16(__p0_863, __p1_863, __p2_863, __p3_863) __extension__ ({ \ 70101 float32x2_t __ret_863; \ 70102 float32x2_t __s0_863 = __p0_863; \ 70103 float16x4_t __s1_863 = __p1_863; \ 70104 float16x4_t __s2_863 = __p2_863; \ 70105 __ret_863 = vfmlal_low_f16(__s0_863, __s1_863, (float16x4_t) {vget_lane_f16(__s2_863, __p3_863), vget_lane_f16(__s2_863, __p3_863), vget_lane_f16(__s2_863, __p3_863), vget_lane_f16(__s2_863, __p3_863)}); \ 70106 __ret_863; \ 70107 }) 70108 #else 70109 #define vfmlal_lane_low_f16(__p0_864, __p1_864, __p2_864, __p3_864) __extension__ ({ \ 70110 float32x2_t __ret_864; \ 70111 float32x2_t __s0_864 = __p0_864; \ 70112 float16x4_t __s1_864 = __p1_864; \ 70113 float16x4_t __s2_864 = __p2_864; \ 70114 float32x2_t __rev0_864; __rev0_864 = __builtin_shufflevector(__s0_864, __s0_864, 1, 0); \ 70115 float16x4_t __rev1_864; __rev1_864 = __builtin_shufflevector(__s1_864, __s1_864, 3, 2, 1, 0); \ 70116 float16x4_t __rev2_864; __rev2_864 = __builtin_shufflevector(__s2_864, __s2_864, 3, 2, 1, 0); \ 70117 __ret_864 = __noswap_vfmlal_low_f16(__rev0_864, __rev1_864, (float16x4_t) {__noswap_vget_lane_f16(__rev2_864, __p3_864), __noswap_vget_lane_f16(__rev2_864, __p3_864), __noswap_vget_lane_f16(__rev2_864, __p3_864), __noswap_vget_lane_f16(__rev2_864, __p3_864)}); \ 70118 __ret_864 = __builtin_shufflevector(__ret_864, __ret_864, 1, 0); \ 70119 __ret_864; \ 70120 }) 70121 #endif 70122 70123 
#ifdef __LITTLE_ENDIAN__ 70124 #define vfmlalq_laneq_high_f16(__p0_865, __p1_865, __p2_865, __p3_865) __extension__ ({ \ 70125 float32x4_t __ret_865; \ 70126 float32x4_t __s0_865 = __p0_865; \ 70127 float16x8_t __s1_865 = __p1_865; \ 70128 float16x8_t __s2_865 = __p2_865; \ 70129 __ret_865 = vfmlalq_high_f16(__s0_865, __s1_865, (float16x8_t) {vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865), vgetq_lane_f16(__s2_865, __p3_865)}); \ 70130 __ret_865; \ 70131 }) 70132 #else 70133 #define vfmlalq_laneq_high_f16(__p0_866, __p1_866, __p2_866, __p3_866) __extension__ ({ \ 70134 float32x4_t __ret_866; \ 70135 float32x4_t __s0_866 = __p0_866; \ 70136 float16x8_t __s1_866 = __p1_866; \ 70137 float16x8_t __s2_866 = __p2_866; \ 70138 float32x4_t __rev0_866; __rev0_866 = __builtin_shufflevector(__s0_866, __s0_866, 3, 2, 1, 0); \ 70139 float16x8_t __rev1_866; __rev1_866 = __builtin_shufflevector(__s1_866, __s1_866, 7, 6, 5, 4, 3, 2, 1, 0); \ 70140 float16x8_t __rev2_866; __rev2_866 = __builtin_shufflevector(__s2_866, __s2_866, 7, 6, 5, 4, 3, 2, 1, 0); \ 70141 __ret_866 = __noswap_vfmlalq_high_f16(__rev0_866, __rev1_866, (float16x8_t) {__noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866), __noswap_vgetq_lane_f16(__rev2_866, __p3_866)}); \ 70142 __ret_866 = __builtin_shufflevector(__ret_866, __ret_866, 3, 2, 1, 0); \ 70143 __ret_866; \ 70144 }) 70145 #endif 70146 70147 #ifdef __LITTLE_ENDIAN__ 70148 #define vfmlal_laneq_high_f16(__p0_867, __p1_867, __p2_867, __p3_867) __extension__ ({ \ 70149 float32x2_t 
__ret_867; \ 70150 float32x2_t __s0_867 = __p0_867; \ 70151 float16x4_t __s1_867 = __p1_867; \ 70152 float16x8_t __s2_867 = __p2_867; \ 70153 __ret_867 = vfmlal_high_f16(__s0_867, __s1_867, (float16x4_t) {vgetq_lane_f16(__s2_867, __p3_867), vgetq_lane_f16(__s2_867, __p3_867), vgetq_lane_f16(__s2_867, __p3_867), vgetq_lane_f16(__s2_867, __p3_867)}); \ 70154 __ret_867; \ 70155 }) 70156 #else 70157 #define vfmlal_laneq_high_f16(__p0_868, __p1_868, __p2_868, __p3_868) __extension__ ({ \ 70158 float32x2_t __ret_868; \ 70159 float32x2_t __s0_868 = __p0_868; \ 70160 float16x4_t __s1_868 = __p1_868; \ 70161 float16x8_t __s2_868 = __p2_868; \ 70162 float32x2_t __rev0_868; __rev0_868 = __builtin_shufflevector(__s0_868, __s0_868, 1, 0); \ 70163 float16x4_t __rev1_868; __rev1_868 = __builtin_shufflevector(__s1_868, __s1_868, 3, 2, 1, 0); \ 70164 float16x8_t __rev2_868; __rev2_868 = __builtin_shufflevector(__s2_868, __s2_868, 7, 6, 5, 4, 3, 2, 1, 0); \ 70165 __ret_868 = __noswap_vfmlal_high_f16(__rev0_868, __rev1_868, (float16x4_t) {__noswap_vgetq_lane_f16(__rev2_868, __p3_868), __noswap_vgetq_lane_f16(__rev2_868, __p3_868), __noswap_vgetq_lane_f16(__rev2_868, __p3_868), __noswap_vgetq_lane_f16(__rev2_868, __p3_868)}); \ 70166 __ret_868 = __builtin_shufflevector(__ret_868, __ret_868, 1, 0); \ 70167 __ret_868; \ 70168 }) 70169 #endif 70170 70171 #ifdef __LITTLE_ENDIAN__ 70172 #define vfmlalq_laneq_low_f16(__p0_869, __p1_869, __p2_869, __p3_869) __extension__ ({ \ 70173 float32x4_t __ret_869; \ 70174 float32x4_t __s0_869 = __p0_869; \ 70175 float16x8_t __s1_869 = __p1_869; \ 70176 float16x8_t __s2_869 = __p2_869; \ 70177 __ret_869 = vfmlalq_low_f16(__s0_869, __s1_869, (float16x8_t) {vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869), vgetq_lane_f16(__s2_869, __p3_869)}); \ 70178 
__ret_869; \ 70179 }) 70180 #else 70181 #define vfmlalq_laneq_low_f16(__p0_870, __p1_870, __p2_870, __p3_870) __extension__ ({ \ 70182 float32x4_t __ret_870; \ 70183 float32x4_t __s0_870 = __p0_870; \ 70184 float16x8_t __s1_870 = __p1_870; \ 70185 float16x8_t __s2_870 = __p2_870; \ 70186 float32x4_t __rev0_870; __rev0_870 = __builtin_shufflevector(__s0_870, __s0_870, 3, 2, 1, 0); \ 70187 float16x8_t __rev1_870; __rev1_870 = __builtin_shufflevector(__s1_870, __s1_870, 7, 6, 5, 4, 3, 2, 1, 0); \ 70188 float16x8_t __rev2_870; __rev2_870 = __builtin_shufflevector(__s2_870, __s2_870, 7, 6, 5, 4, 3, 2, 1, 0); \ 70189 __ret_870 = __noswap_vfmlalq_low_f16(__rev0_870, __rev1_870, (float16x8_t) {__noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870), __noswap_vgetq_lane_f16(__rev2_870, __p3_870)}); \ 70190 __ret_870 = __builtin_shufflevector(__ret_870, __ret_870, 3, 2, 1, 0); \ 70191 __ret_870; \ 70192 }) 70193 #endif 70194 70195 #ifdef __LITTLE_ENDIAN__ 70196 #define vfmlal_laneq_low_f16(__p0_871, __p1_871, __p2_871, __p3_871) __extension__ ({ \ 70197 float32x2_t __ret_871; \ 70198 float32x2_t __s0_871 = __p0_871; \ 70199 float16x4_t __s1_871 = __p1_871; \ 70200 float16x8_t __s2_871 = __p2_871; \ 70201 __ret_871 = vfmlal_low_f16(__s0_871, __s1_871, (float16x4_t) {vgetq_lane_f16(__s2_871, __p3_871), vgetq_lane_f16(__s2_871, __p3_871), vgetq_lane_f16(__s2_871, __p3_871), vgetq_lane_f16(__s2_871, __p3_871)}); \ 70202 __ret_871; \ 70203 }) 70204 #else 70205 #define vfmlal_laneq_low_f16(__p0_872, __p1_872, __p2_872, __p3_872) __extension__ ({ \ 70206 float32x2_t __ret_872; \ 70207 float32x2_t __s0_872 = __p0_872; \ 70208 float16x4_t __s1_872 = __p1_872; \ 70209 float16x8_t __s2_872 = __p2_872; \ 70210 
float32x2_t __rev0_872; __rev0_872 = __builtin_shufflevector(__s0_872, __s0_872, 1, 0); \ 70211 float16x4_t __rev1_872; __rev1_872 = __builtin_shufflevector(__s1_872, __s1_872, 3, 2, 1, 0); \ 70212 float16x8_t __rev2_872; __rev2_872 = __builtin_shufflevector(__s2_872, __s2_872, 7, 6, 5, 4, 3, 2, 1, 0); \ 70213 __ret_872 = __noswap_vfmlal_low_f16(__rev0_872, __rev1_872, (float16x4_t) {__noswap_vgetq_lane_f16(__rev2_872, __p3_872), __noswap_vgetq_lane_f16(__rev2_872, __p3_872), __noswap_vgetq_lane_f16(__rev2_872, __p3_872), __noswap_vgetq_lane_f16(__rev2_872, __p3_872)}); \ 70214 __ret_872 = __builtin_shufflevector(__ret_872, __ret_872, 1, 0); \ 70215 __ret_872; \ 70216 }) 70217 #endif 70218 70219 #ifdef __LITTLE_ENDIAN__ 70220 #define vfmlslq_lane_high_f16(__p0_873, __p1_873, __p2_873, __p3_873) __extension__ ({ \ 70221 float32x4_t __ret_873; \ 70222 float32x4_t __s0_873 = __p0_873; \ 70223 float16x8_t __s1_873 = __p1_873; \ 70224 float16x4_t __s2_873 = __p2_873; \ 70225 __ret_873 = vfmlslq_high_f16(__s0_873, __s1_873, (float16x8_t) {vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873), vget_lane_f16(__s2_873, __p3_873)}); \ 70226 __ret_873; \ 70227 }) 70228 #else 70229 #define vfmlslq_lane_high_f16(__p0_874, __p1_874, __p2_874, __p3_874) __extension__ ({ \ 70230 float32x4_t __ret_874; \ 70231 float32x4_t __s0_874 = __p0_874; \ 70232 float16x8_t __s1_874 = __p1_874; \ 70233 float16x4_t __s2_874 = __p2_874; \ 70234 float32x4_t __rev0_874; __rev0_874 = __builtin_shufflevector(__s0_874, __s0_874, 3, 2, 1, 0); \ 70235 float16x8_t __rev1_874; __rev1_874 = __builtin_shufflevector(__s1_874, __s1_874, 7, 6, 5, 4, 3, 2, 1, 0); \ 70236 float16x4_t __rev2_874; __rev2_874 = __builtin_shufflevector(__s2_874, __s2_874, 3, 2, 1, 0); \ 70237 __ret_874 = __noswap_vfmlslq_high_f16(__rev0_874, 
__rev1_874, (float16x8_t) {__noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874), __noswap_vget_lane_f16(__rev2_874, __p3_874)}); \ 70238 __ret_874 = __builtin_shufflevector(__ret_874, __ret_874, 3, 2, 1, 0); \ 70239 __ret_874; \ 70240 }) 70241 #endif 70242 70243 #ifdef __LITTLE_ENDIAN__ 70244 #define vfmlsl_lane_high_f16(__p0_875, __p1_875, __p2_875, __p3_875) __extension__ ({ \ 70245 float32x2_t __ret_875; \ 70246 float32x2_t __s0_875 = __p0_875; \ 70247 float16x4_t __s1_875 = __p1_875; \ 70248 float16x4_t __s2_875 = __p2_875; \ 70249 __ret_875 = vfmlsl_high_f16(__s0_875, __s1_875, (float16x4_t) {vget_lane_f16(__s2_875, __p3_875), vget_lane_f16(__s2_875, __p3_875), vget_lane_f16(__s2_875, __p3_875), vget_lane_f16(__s2_875, __p3_875)}); \ 70250 __ret_875; \ 70251 }) 70252 #else 70253 #define vfmlsl_lane_high_f16(__p0_876, __p1_876, __p2_876, __p3_876) __extension__ ({ \ 70254 float32x2_t __ret_876; \ 70255 float32x2_t __s0_876 = __p0_876; \ 70256 float16x4_t __s1_876 = __p1_876; \ 70257 float16x4_t __s2_876 = __p2_876; \ 70258 float32x2_t __rev0_876; __rev0_876 = __builtin_shufflevector(__s0_876, __s0_876, 1, 0); \ 70259 float16x4_t __rev1_876; __rev1_876 = __builtin_shufflevector(__s1_876, __s1_876, 3, 2, 1, 0); \ 70260 float16x4_t __rev2_876; __rev2_876 = __builtin_shufflevector(__s2_876, __s2_876, 3, 2, 1, 0); \ 70261 __ret_876 = __noswap_vfmlsl_high_f16(__rev0_876, __rev1_876, (float16x4_t) {__noswap_vget_lane_f16(__rev2_876, __p3_876), __noswap_vget_lane_f16(__rev2_876, __p3_876), __noswap_vget_lane_f16(__rev2_876, __p3_876), __noswap_vget_lane_f16(__rev2_876, __p3_876)}); \ 70262 __ret_876 = __builtin_shufflevector(__ret_876, __ret_876, 1, 0); \ 70263 __ret_876; \ 70264 }) 70265 #endif 70266 
70267 #ifdef __LITTLE_ENDIAN__ 70268 #define vfmlslq_lane_low_f16(__p0_877, __p1_877, __p2_877, __p3_877) __extension__ ({ \ 70269 float32x4_t __ret_877; \ 70270 float32x4_t __s0_877 = __p0_877; \ 70271 float16x8_t __s1_877 = __p1_877; \ 70272 float16x4_t __s2_877 = __p2_877; \ 70273 __ret_877 = vfmlslq_low_f16(__s0_877, __s1_877, (float16x8_t) {vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877), vget_lane_f16(__s2_877, __p3_877)}); \ 70274 __ret_877; \ 70275 }) 70276 #else 70277 #define vfmlslq_lane_low_f16(__p0_878, __p1_878, __p2_878, __p3_878) __extension__ ({ \ 70278 float32x4_t __ret_878; \ 70279 float32x4_t __s0_878 = __p0_878; \ 70280 float16x8_t __s1_878 = __p1_878; \ 70281 float16x4_t __s2_878 = __p2_878; \ 70282 float32x4_t __rev0_878; __rev0_878 = __builtin_shufflevector(__s0_878, __s0_878, 3, 2, 1, 0); \ 70283 float16x8_t __rev1_878; __rev1_878 = __builtin_shufflevector(__s1_878, __s1_878, 7, 6, 5, 4, 3, 2, 1, 0); \ 70284 float16x4_t __rev2_878; __rev2_878 = __builtin_shufflevector(__s2_878, __s2_878, 3, 2, 1, 0); \ 70285 __ret_878 = __noswap_vfmlslq_low_f16(__rev0_878, __rev1_878, (float16x8_t) {__noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878), __noswap_vget_lane_f16(__rev2_878, __p3_878)}); \ 70286 __ret_878 = __builtin_shufflevector(__ret_878, __ret_878, 3, 2, 1, 0); \ 70287 __ret_878; \ 70288 }) 70289 #endif 70290 70291 #ifdef __LITTLE_ENDIAN__ 70292 #define vfmlsl_lane_low_f16(__p0_879, __p1_879, __p2_879, __p3_879) __extension__ ({ \ 70293 float32x2_t __ret_879; \ 70294 float32x2_t __s0_879 
= __p0_879; \ 70295 float16x4_t __s1_879 = __p1_879; \ 70296 float16x4_t __s2_879 = __p2_879; \ 70297 __ret_879 = vfmlsl_low_f16(__s0_879, __s1_879, (float16x4_t) {vget_lane_f16(__s2_879, __p3_879), vget_lane_f16(__s2_879, __p3_879), vget_lane_f16(__s2_879, __p3_879), vget_lane_f16(__s2_879, __p3_879)}); \ 70298 __ret_879; \ 70299 }) 70300 #else 70301 #define vfmlsl_lane_low_f16(__p0_880, __p1_880, __p2_880, __p3_880) __extension__ ({ \ 70302 float32x2_t __ret_880; \ 70303 float32x2_t __s0_880 = __p0_880; \ 70304 float16x4_t __s1_880 = __p1_880; \ 70305 float16x4_t __s2_880 = __p2_880; \ 70306 float32x2_t __rev0_880; __rev0_880 = __builtin_shufflevector(__s0_880, __s0_880, 1, 0); \ 70307 float16x4_t __rev1_880; __rev1_880 = __builtin_shufflevector(__s1_880, __s1_880, 3, 2, 1, 0); \ 70308 float16x4_t __rev2_880; __rev2_880 = __builtin_shufflevector(__s2_880, __s2_880, 3, 2, 1, 0); \ 70309 __ret_880 = __noswap_vfmlsl_low_f16(__rev0_880, __rev1_880, (float16x4_t) {__noswap_vget_lane_f16(__rev2_880, __p3_880), __noswap_vget_lane_f16(__rev2_880, __p3_880), __noswap_vget_lane_f16(__rev2_880, __p3_880), __noswap_vget_lane_f16(__rev2_880, __p3_880)}); \ 70310 __ret_880 = __builtin_shufflevector(__ret_880, __ret_880, 1, 0); \ 70311 __ret_880; \ 70312 }) 70313 #endif 70314 70315 #ifdef __LITTLE_ENDIAN__ 70316 #define vfmlslq_laneq_high_f16(__p0_881, __p1_881, __p2_881, __p3_881) __extension__ ({ \ 70317 float32x4_t __ret_881; \ 70318 float32x4_t __s0_881 = __p0_881; \ 70319 float16x8_t __s1_881 = __p1_881; \ 70320 float16x8_t __s2_881 = __p2_881; \ 70321 __ret_881 = vfmlslq_high_f16(__s0_881, __s1_881, (float16x8_t) {vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881), vgetq_lane_f16(__s2_881, __p3_881)}); \ 70322 __ret_881; \ 70323 }) 70324 #else 70325 #define 
vfmlslq_laneq_high_f16(__p0_882, __p1_882, __p2_882, __p3_882) __extension__ ({ \ 70326 float32x4_t __ret_882; \ 70327 float32x4_t __s0_882 = __p0_882; \ 70328 float16x8_t __s1_882 = __p1_882; \ 70329 float16x8_t __s2_882 = __p2_882; \ 70330 float32x4_t __rev0_882; __rev0_882 = __builtin_shufflevector(__s0_882, __s0_882, 3, 2, 1, 0); \ 70331 float16x8_t __rev1_882; __rev1_882 = __builtin_shufflevector(__s1_882, __s1_882, 7, 6, 5, 4, 3, 2, 1, 0); \ 70332 float16x8_t __rev2_882; __rev2_882 = __builtin_shufflevector(__s2_882, __s2_882, 7, 6, 5, 4, 3, 2, 1, 0); \ 70333 __ret_882 = __noswap_vfmlslq_high_f16(__rev0_882, __rev1_882, (float16x8_t) {__noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882), __noswap_vgetq_lane_f16(__rev2_882, __p3_882)}); \ 70334 __ret_882 = __builtin_shufflevector(__ret_882, __ret_882, 3, 2, 1, 0); \ 70335 __ret_882; \ 70336 }) 70337 #endif 70338 70339 #ifdef __LITTLE_ENDIAN__ 70340 #define vfmlsl_laneq_high_f16(__p0_883, __p1_883, __p2_883, __p3_883) __extension__ ({ \ 70341 float32x2_t __ret_883; \ 70342 float32x2_t __s0_883 = __p0_883; \ 70343 float16x4_t __s1_883 = __p1_883; \ 70344 float16x8_t __s2_883 = __p2_883; \ 70345 __ret_883 = vfmlsl_high_f16(__s0_883, __s1_883, (float16x4_t) {vgetq_lane_f16(__s2_883, __p3_883), vgetq_lane_f16(__s2_883, __p3_883), vgetq_lane_f16(__s2_883, __p3_883), vgetq_lane_f16(__s2_883, __p3_883)}); \ 70346 __ret_883; \ 70347 }) 70348 #else 70349 #define vfmlsl_laneq_high_f16(__p0_884, __p1_884, __p2_884, __p3_884) __extension__ ({ \ 70350 float32x2_t __ret_884; \ 70351 float32x2_t __s0_884 = __p0_884; \ 70352 float16x4_t __s1_884 = __p1_884; \ 70353 float16x8_t __s2_884 = __p2_884; \ 70354 float32x2_t __rev0_884; __rev0_884 = 
__builtin_shufflevector(__s0_884, __s0_884, 1, 0); \ 70355 float16x4_t __rev1_884; __rev1_884 = __builtin_shufflevector(__s1_884, __s1_884, 3, 2, 1, 0); \ 70356 float16x8_t __rev2_884; __rev2_884 = __builtin_shufflevector(__s2_884, __s2_884, 7, 6, 5, 4, 3, 2, 1, 0); \ 70357 __ret_884 = __noswap_vfmlsl_high_f16(__rev0_884, __rev1_884, (float16x4_t) {__noswap_vgetq_lane_f16(__rev2_884, __p3_884), __noswap_vgetq_lane_f16(__rev2_884, __p3_884), __noswap_vgetq_lane_f16(__rev2_884, __p3_884), __noswap_vgetq_lane_f16(__rev2_884, __p3_884)}); \ 70358 __ret_884 = __builtin_shufflevector(__ret_884, __ret_884, 1, 0); \ 70359 __ret_884; \ 70360 }) 70361 #endif 70362 70363 /* vfmlslq_laneq_low_f16(__p0, __p1, __p2, __p3): fills a float16x8_t with eight copies of vgetq_lane_f16(__p2, __p3) and passes it, together with __p0 and __p1, to vfmlslq_low_f16. The #else variant does the same on element-reversed inputs via the __noswap_ helpers and reverses the 4-element result. */ #ifdef __LITTLE_ENDIAN__ 70364 #define vfmlslq_laneq_low_f16(__p0_885, __p1_885, __p2_885, __p3_885) __extension__ ({ \ 70365 float32x4_t __ret_885; \ 70366 float32x4_t __s0_885 = __p0_885; \ 70367 float16x8_t __s1_885 = __p1_885; \ 70368 float16x8_t __s2_885 = __p2_885; \ 70369 __ret_885 = vfmlslq_low_f16(__s0_885, __s1_885, (float16x8_t) {vgetq_lane_f16(__s2_885, __p3_885), vgetq_lane_f16(__s2_885, __p3_885), vgetq_lane_f16(__s2_885, __p3_885), vgetq_lane_f16(__s2_885, __p3_885), vgetq_lane_f16(__s2_885, __p3_885), vgetq_lane_f16(__s2_885, __p3_885), vgetq_lane_f16(__s2_885, __p3_885), vgetq_lane_f16(__s2_885, __p3_885)}); \ 70370 __ret_885; \ 70371 }) 70372 #else 70373 #define vfmlslq_laneq_low_f16(__p0_886, __p1_886, __p2_886, __p3_886) __extension__ ({ \ 70374 float32x4_t __ret_886; \ 70375 float32x4_t __s0_886 = __p0_886; \ 70376 float16x8_t __s1_886 = __p1_886; \ 70377 float16x8_t __s2_886 = __p2_886; \ 70378 float32x4_t __rev0_886; __rev0_886 = __builtin_shufflevector(__s0_886, __s0_886, 3, 2, 1, 0); \ 70379 float16x8_t __rev1_886; __rev1_886 = __builtin_shufflevector(__s1_886, __s1_886, 7, 6, 5, 4, 3, 2, 1, 0); \ 70380 float16x8_t __rev2_886; __rev2_886 = __builtin_shufflevector(__s2_886, __s2_886, 7, 6, 5, 4, 3, 2, 1, 0); \ 70381 __ret_886 = __noswap_vfmlslq_low_f16(__rev0_886, __rev1_886, 
(float16x8_t) {__noswap_vgetq_lane_f16(__rev2_886, __p3_886), __noswap_vgetq_lane_f16(__rev2_886, __p3_886), __noswap_vgetq_lane_f16(__rev2_886, __p3_886), __noswap_vgetq_lane_f16(__rev2_886, __p3_886), __noswap_vgetq_lane_f16(__rev2_886, __p3_886), __noswap_vgetq_lane_f16(__rev2_886, __p3_886), __noswap_vgetq_lane_f16(__rev2_886, __p3_886), __noswap_vgetq_lane_f16(__rev2_886, __p3_886)}); \ 70382 __ret_886 = __builtin_shufflevector(__ret_886, __ret_886, 3, 2, 1, 0); \ 70383 __ret_886; \ 70384 }) 70385 #endif 70386 70387 /* vfmlsl_laneq_low_f16(__p0, __p1, __p2, __p3): the lane source __p2 is a float16x8_t, but the broadcast built from vgetq_lane_f16(__p2, __p3) is a 4-element float16x4_t; it is passed with __p0 and __p1 to vfmlsl_low_f16. The #else variant works on element-reversed inputs via the __noswap_ helpers and reverses the 2-element result. */ #ifdef __LITTLE_ENDIAN__ 70388 #define vfmlsl_laneq_low_f16(__p0_887, __p1_887, __p2_887, __p3_887) __extension__ ({ \ 70389 float32x2_t __ret_887; \ 70390 float32x2_t __s0_887 = __p0_887; \ 70391 float16x4_t __s1_887 = __p1_887; \ 70392 float16x8_t __s2_887 = __p2_887; \ 70393 __ret_887 = vfmlsl_low_f16(__s0_887, __s1_887, (float16x4_t) {vgetq_lane_f16(__s2_887, __p3_887), vgetq_lane_f16(__s2_887, __p3_887), vgetq_lane_f16(__s2_887, __p3_887), vgetq_lane_f16(__s2_887, __p3_887)}); \ 70394 __ret_887; \ 70395 }) 70396 #else 70397 #define vfmlsl_laneq_low_f16(__p0_888, __p1_888, __p2_888, __p3_888) __extension__ ({ \ 70398 float32x2_t __ret_888; \ 70399 float32x2_t __s0_888 = __p0_888; \ 70400 float16x4_t __s1_888 = __p1_888; \ 70401 float16x8_t __s2_888 = __p2_888; \ 70402 float32x2_t __rev0_888; __rev0_888 = __builtin_shufflevector(__s0_888, __s0_888, 1, 0); \ 70403 float16x4_t __rev1_888; __rev1_888 = __builtin_shufflevector(__s1_888, __s1_888, 3, 2, 1, 0); \ 70404 float16x8_t __rev2_888; __rev2_888 = __builtin_shufflevector(__s2_888, __s2_888, 7, 6, 5, 4, 3, 2, 1, 0); \ 70405 __ret_888 = __noswap_vfmlsl_low_f16(__rev0_888, __rev1_888, (float16x4_t) {__noswap_vgetq_lane_f16(__rev2_888, __p3_888), __noswap_vgetq_lane_f16(__rev2_888, __p3_888), __noswap_vgetq_lane_f16(__rev2_888, __p3_888), __noswap_vgetq_lane_f16(__rev2_888, __p3_888)}); \ 70406 __ret_888 = __builtin_shufflevector(__ret_888, __ret_888, 1, 0); \ 70407 __ret_888; \ 70408 }) 70409 
#endif 70410 70411 /* vmulh_lane_f16(__p0, __p1, __p2): scalar float16_t product of __p0 and lane __p2 of the float16x4_t __p1. The #else variant reverses __p1 and reads the lane with __noswap_vget_lane_f16; the scalar result needs no reversal. */ #ifdef __LITTLE_ENDIAN__ 70412 #define vmulh_lane_f16(__p0_889, __p1_889, __p2_889) __extension__ ({ \ 70413 float16_t __ret_889; \ 70414 float16_t __s0_889 = __p0_889; \ 70415 float16x4_t __s1_889 = __p1_889; \ 70416 __ret_889 = __s0_889 * vget_lane_f16(__s1_889, __p2_889); \ 70417 __ret_889; \ 70418 }) 70419 #else 70420 #define vmulh_lane_f16(__p0_890, __p1_890, __p2_890) __extension__ ({ \ 70421 float16_t __ret_890; \ 70422 float16_t __s0_890 = __p0_890; \ 70423 float16x4_t __s1_890 = __p1_890; \ 70424 float16x4_t __rev1_890; __rev1_890 = __builtin_shufflevector(__s1_890, __s1_890, 3, 2, 1, 0); \ 70425 __ret_890 = __s0_890 * __noswap_vget_lane_f16(__rev1_890, __p2_890); \ 70426 __ret_890; \ 70427 }) 70428 #endif 70429 70430 /* vmulh_laneq_f16(__p0, __p1, __p2): same as vmulh_lane_f16 but the lane is taken from a float16x8_t with vgetq_lane_f16. */ #ifdef __LITTLE_ENDIAN__ 70431 #define vmulh_laneq_f16(__p0_891, __p1_891, __p2_891) __extension__ ({ \ 70432 float16_t __ret_891; \ 70433 float16_t __s0_891 = __p0_891; \ 70434 float16x8_t __s1_891 = __p1_891; \ 70435 __ret_891 = __s0_891 * vgetq_lane_f16(__s1_891, __p2_891); \ 70436 __ret_891; \ 70437 }) 70438 #else 70439 #define vmulh_laneq_f16(__p0_892, __p1_892, __p2_892) __extension__ ({ \ 70440 float16_t __ret_892; \ 70441 float16_t __s0_892 = __p0_892; \ 70442 float16x8_t __s1_892 = __p1_892; \ 70443 float16x8_t __rev1_892; __rev1_892 = __builtin_shufflevector(__s1_892, __s1_892, 7, 6, 5, 4, 3, 2, 1, 0); \ 70444 __ret_892 = __s0_892 * __noswap_vgetq_lane_f16(__rev1_892, __p2_892); \ 70445 __ret_892; \ 70446 }) 70447 #endif 70448 70449 /* vabdl_high_u8: returns vabdl_u8 applied to vget_high_u8 of each argument. The #else variant reverses both 16-element inputs, uses the __noswap_ helpers, and reverses the 8-element result. */ #ifdef __LITTLE_ENDIAN__ 70450 __ai __attribute__((target("neon"))) uint16x8_t vabdl_high_u8(uint8x16_t __p0, uint8x16_t __p1) { 70451 uint16x8_t __ret; 70452 __ret = vabdl_u8(vget_high_u8(__p0), vget_high_u8(__p1)); 70453 return __ret; 70454 } 70455 #else 70456 __ai __attribute__((target("neon"))) uint16x8_t vabdl_high_u8(uint8x16_t __p0, uint8x16_t __p1) { 70457 uint16x8_t __ret; 70458 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 
5, 4, 3, 2, 1, 0); 70459 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70460 __ret = __noswap_vabdl_u8(__noswap_vget_high_u8(__rev0), __noswap_vget_high_u8(__rev1)); 70461 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 70462 return __ret; 70463 } 70464 #endif 70465 70466 /* vabdl_high_u32: returns vabdl_u32 applied to vget_high_u32 of each argument. The #else variant reverses both 4-element inputs, uses the __noswap_ helpers, and reverses the 2-element result. */ #ifdef __LITTLE_ENDIAN__ 70467 __ai __attribute__((target("neon"))) uint64x2_t vabdl_high_u32(uint32x4_t __p0, uint32x4_t __p1) { 70468 uint64x2_t __ret; 70469 __ret = vabdl_u32(vget_high_u32(__p0), vget_high_u32(__p1)); 70470 return __ret; 70471 } 70472 #else 70473 __ai __attribute__((target("neon"))) uint64x2_t vabdl_high_u32(uint32x4_t __p0, uint32x4_t __p1) { 70474 uint64x2_t __ret; 70475 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 70476 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 70477 __ret = __noswap_vabdl_u32(__noswap_vget_high_u32(__rev0), __noswap_vget_high_u32(__rev1)); 70478 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 70479 return __ret; 70480 } 70481 #endif 70482 70483 /* vabdl_high_u16: returns vabdl_u16 applied to vget_high_u16 of each argument. The #else variant reverses both 8-element inputs, uses the __noswap_ helpers, and reverses the 4-element result. */ #ifdef __LITTLE_ENDIAN__ 70484 __ai __attribute__((target("neon"))) uint32x4_t vabdl_high_u16(uint16x8_t __p0, uint16x8_t __p1) { 70485 uint32x4_t __ret; 70486 __ret = vabdl_u16(vget_high_u16(__p0), vget_high_u16(__p1)); 70487 return __ret; 70488 } 70489 #else 70490 __ai __attribute__((target("neon"))) uint32x4_t vabdl_high_u16(uint16x8_t __p0, uint16x8_t __p1) { 70491 uint32x4_t __ret; 70492 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 70493 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 70494 __ret = __noswap_vabdl_u16(__noswap_vget_high_u16(__rev0), __noswap_vget_high_u16(__rev1)); 70495 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 70496 return __ret; 70497 } 70498 #endif 70499 70500 #ifdef __LITTLE_ENDIAN__ 70501 __ai __attribute__((target("neon"))) 
int16x8_t vabdl_high_s8(int8x16_t __p0, int8x16_t __p1) { 70502 int16x8_t __ret; 70503 __ret = vabdl_s8(vget_high_s8(__p0), vget_high_s8(__p1)); 70504 return __ret; 70505 } 70506 #else /* Non-little-endian vabdl_high_s8: reverses both 16-element inputs, applies __noswap_vabdl_s8 to their __noswap_vget_high_s8 halves, and reverses the 8-element result. */ 70507 __ai __attribute__((target("neon"))) int16x8_t vabdl_high_s8(int8x16_t __p0, int8x16_t __p1) { 70508 int16x8_t __ret; 70509 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70510 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70511 __ret = __noswap_vabdl_s8(__noswap_vget_high_s8(__rev0), __noswap_vget_high_s8(__rev1)); 70512 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 70513 return __ret; 70514 } 70515 #endif 70516 70517 /* vabdl_high_s32: returns vabdl_s32 applied to vget_high_s32 of each argument. The #else variant reverses both 4-element inputs, uses the __noswap_ helpers, and reverses the 2-element result. */ #ifdef __LITTLE_ENDIAN__ 70518 __ai __attribute__((target("neon"))) int64x2_t vabdl_high_s32(int32x4_t __p0, int32x4_t __p1) { 70519 int64x2_t __ret; 70520 __ret = vabdl_s32(vget_high_s32(__p0), vget_high_s32(__p1)); 70521 return __ret; 70522 } 70523 #else 70524 __ai __attribute__((target("neon"))) int64x2_t vabdl_high_s32(int32x4_t __p0, int32x4_t __p1) { 70525 int64x2_t __ret; 70526 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 70527 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 70528 __ret = __noswap_vabdl_s32(__noswap_vget_high_s32(__rev0), __noswap_vget_high_s32(__rev1)); 70529 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 70530 return __ret; 70531 } 70532 #endif 70533 70534 /* vabdl_high_s16: returns vabdl_s16 applied to vget_high_s16 of each argument. The #else variant reverses both 8-element inputs, uses the __noswap_ helpers, and reverses the 4-element result. */ #ifdef __LITTLE_ENDIAN__ 70535 __ai __attribute__((target("neon"))) int32x4_t vabdl_high_s16(int16x8_t __p0, int16x8_t __p1) { 70536 int32x4_t __ret; 70537 __ret = vabdl_s16(vget_high_s16(__p0), vget_high_s16(__p1)); 70538 return __ret; 70539 } 70540 #else 70541 __ai __attribute__((target("neon"))) int32x4_t vabdl_high_s16(int16x8_t __p0, int16x8_t __p1) { 70542 int32x4_t __ret; 70543 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 
4, 3, 2, 1, 0); 70544 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 70545 __ret = __noswap_vabdl_s16(__noswap_vget_high_s16(__rev0), __noswap_vget_high_s16(__rev1)); 70546 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 70547 return __ret; 70548 } 70549 #endif 70550 70551 /* vaddl_high_u8: returns vmovl_high_u8(__p0) + vmovl_high_u8(__p1) as a uint16x8_t. The #else variant reverses both 16-element inputs, uses __noswap_vmovl_high_u8, and reverses the 8-element sum. */ #ifdef __LITTLE_ENDIAN__ 70552 __ai __attribute__((target("neon"))) uint16x8_t vaddl_high_u8(uint8x16_t __p0, uint8x16_t __p1) { 70553 uint16x8_t __ret; 70554 __ret = vmovl_high_u8(__p0) + vmovl_high_u8(__p1); 70555 return __ret; 70556 } 70557 #else 70558 __ai __attribute__((target("neon"))) uint16x8_t vaddl_high_u8(uint8x16_t __p0, uint8x16_t __p1) { 70559 uint16x8_t __ret; 70560 uint8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70561 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70562 __ret = __noswap_vmovl_high_u8(__rev0) + __noswap_vmovl_high_u8(__rev1); 70563 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 70564 return __ret; 70565 } 70566 #endif 70567 70568 /* vaddl_high_u32: returns vmovl_high_u32(__p0) + vmovl_high_u32(__p1) as a uint64x2_t. The #else variant reverses both 4-element inputs, uses __noswap_vmovl_high_u32, and reverses the 2-element sum. */ #ifdef __LITTLE_ENDIAN__ 70569 __ai __attribute__((target("neon"))) uint64x2_t vaddl_high_u32(uint32x4_t __p0, uint32x4_t __p1) { 70570 uint64x2_t __ret; 70571 __ret = vmovl_high_u32(__p0) + vmovl_high_u32(__p1); 70572 return __ret; 70573 } 70574 #else 70575 __ai __attribute__((target("neon"))) uint64x2_t vaddl_high_u32(uint32x4_t __p0, uint32x4_t __p1) { 70576 uint64x2_t __ret; 70577 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 70578 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 70579 __ret = __noswap_vmovl_high_u32(__rev0) + __noswap_vmovl_high_u32(__rev1); 70580 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 70581 return __ret; 70582 } 70583 #endif 70584 70585 #ifdef __LITTLE_ENDIAN__ 70586 __ai __attribute__((target("neon"))) uint32x4_t 
vaddl_high_u16(uint16x8_t __p0, uint16x8_t __p1) { 70587 uint32x4_t __ret; 70588 __ret = vmovl_high_u16(__p0) + vmovl_high_u16(__p1); 70589 return __ret; 70590 } 70591 #else /* Non-little-endian vaddl_high_u16: reverses both 8-element inputs, adds their __noswap_vmovl_high_u16 results, and reverses the 4-element sum. */ 70592 __ai __attribute__((target("neon"))) uint32x4_t vaddl_high_u16(uint16x8_t __p0, uint16x8_t __p1) { 70593 uint32x4_t __ret; 70594 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 70595 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 70596 __ret = __noswap_vmovl_high_u16(__rev0) + __noswap_vmovl_high_u16(__rev1); 70597 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 70598 return __ret; 70599 } 70600 #endif 70601 70602 /* vaddl_high_s8: returns vmovl_high_s8(__p0) + vmovl_high_s8(__p1) as an int16x8_t. The #else variant reverses both 16-element inputs, uses __noswap_vmovl_high_s8, and reverses the 8-element sum. */ #ifdef __LITTLE_ENDIAN__ 70603 __ai __attribute__((target("neon"))) int16x8_t vaddl_high_s8(int8x16_t __p0, int8x16_t __p1) { 70604 int16x8_t __ret; 70605 __ret = vmovl_high_s8(__p0) + vmovl_high_s8(__p1); 70606 return __ret; 70607 } 70608 #else 70609 __ai __attribute__((target("neon"))) int16x8_t vaddl_high_s8(int8x16_t __p0, int8x16_t __p1) { 70610 int16x8_t __ret; 70611 int8x16_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70612 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70613 __ret = __noswap_vmovl_high_s8(__rev0) + __noswap_vmovl_high_s8(__rev1); 70614 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 70615 return __ret; 70616 } 70617 #endif 70618 70619 /* vaddl_high_s32: returns vmovl_high_s32(__p0) + vmovl_high_s32(__p1) as an int64x2_t. The #else variant reverses both 4-element inputs, uses __noswap_vmovl_high_s32, and reverses the 2-element sum. */ #ifdef __LITTLE_ENDIAN__ 70620 __ai __attribute__((target("neon"))) int64x2_t vaddl_high_s32(int32x4_t __p0, int32x4_t __p1) { 70621 int64x2_t __ret; 70622 __ret = vmovl_high_s32(__p0) + vmovl_high_s32(__p1); 70623 return __ret; 70624 } 70625 #else 70626 __ai __attribute__((target("neon"))) int64x2_t vaddl_high_s32(int32x4_t __p0, int32x4_t __p1) { 70627 int64x2_t __ret; 70628 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 70629 int32x4_t __rev1; 
__rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 70630 __ret = __noswap_vmovl_high_s32(__rev0) + __noswap_vmovl_high_s32(__rev1); 70631 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 70632 return __ret; 70633 } 70634 #endif 70635 70636 /* vaddl_high_s16: returns vmovl_high_s16(__p0) + vmovl_high_s16(__p1) as an int32x4_t. The #else variant reverses both 8-element inputs, uses __noswap_vmovl_high_s16, and reverses the 4-element sum. */ #ifdef __LITTLE_ENDIAN__ 70637 __ai __attribute__((target("neon"))) int32x4_t vaddl_high_s16(int16x8_t __p0, int16x8_t __p1) { 70638 int32x4_t __ret; 70639 __ret = vmovl_high_s16(__p0) + vmovl_high_s16(__p1); 70640 return __ret; 70641 } 70642 #else 70643 __ai __attribute__((target("neon"))) int32x4_t vaddl_high_s16(int16x8_t __p0, int16x8_t __p1) { 70644 int32x4_t __ret; 70645 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 70646 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 70647 __ret = __noswap_vmovl_high_s16(__rev0) + __noswap_vmovl_high_s16(__rev1); 70648 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 70649 return __ret; 70650 } 70651 #endif 70652 70653 /* vaddw_high_u8: returns __p0 + vmovl_high_u8(__p1); __p0 already has the result type uint16x8_t. The #else variant reverses __p0 (8 elements) and __p1 (16 elements), uses __noswap_vmovl_high_u8, and reverses the sum. */ #ifdef __LITTLE_ENDIAN__ 70654 __ai __attribute__((target("neon"))) uint16x8_t vaddw_high_u8(uint16x8_t __p0, uint8x16_t __p1) { 70655 uint16x8_t __ret; 70656 __ret = __p0 + vmovl_high_u8(__p1); 70657 return __ret; 70658 } 70659 #else 70660 __ai __attribute__((target("neon"))) uint16x8_t vaddw_high_u8(uint16x8_t __p0, uint8x16_t __p1) { 70661 uint16x8_t __ret; 70662 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 70663 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70664 __ret = __rev0 + __noswap_vmovl_high_u8(__rev1); 70665 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 70666 return __ret; 70667 } 70668 #endif 70669 70670 /* vaddw_high_u32 (little-endian variant): returns __p0 + vmovl_high_u32(__p1) as a uint64x2_t. */ #ifdef __LITTLE_ENDIAN__ 70671 __ai __attribute__((target("neon"))) uint64x2_t vaddw_high_u32(uint64x2_t __p0, uint32x4_t __p1) { 70672 uint64x2_t __ret; 70673 __ret = __p0 + vmovl_high_u32(__p1); 70674 return __ret; 
70675 } 70676 #else /* Non-little-endian vaddw_high_u32: reverses __p0 (2 elements) and __p1 (4 elements), computes __rev0 + __noswap_vmovl_high_u32(__rev1), and reverses the 2-element sum. */ 70677 __ai __attribute__((target("neon"))) uint64x2_t vaddw_high_u32(uint64x2_t __p0, uint32x4_t __p1) { 70678 uint64x2_t __ret; 70679 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 70680 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 70681 __ret = __rev0 + __noswap_vmovl_high_u32(__rev1); 70682 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 70683 return __ret; 70684 } 70685 #endif 70686 70687 /* vaddw_high_u16: returns __p0 + vmovl_high_u16(__p1) as a uint32x4_t. The #else variant reverses __p0 (4 elements) and __p1 (8 elements), uses __noswap_vmovl_high_u16, and reverses the sum. */ #ifdef __LITTLE_ENDIAN__ 70688 __ai __attribute__((target("neon"))) uint32x4_t vaddw_high_u16(uint32x4_t __p0, uint16x8_t __p1) { 70689 uint32x4_t __ret; 70690 __ret = __p0 + vmovl_high_u16(__p1); 70691 return __ret; 70692 } 70693 #else 70694 __ai __attribute__((target("neon"))) uint32x4_t vaddw_high_u16(uint32x4_t __p0, uint16x8_t __p1) { 70695 uint32x4_t __ret; 70696 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 70697 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 70698 __ret = __rev0 + __noswap_vmovl_high_u16(__rev1); 70699 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 70700 return __ret; 70701 } 70702 #endif 70703 70704 /* vaddw_high_s8: returns __p0 + vmovl_high_s8(__p1) as an int16x8_t. The #else variant reverses __p0 (8 elements) and __p1 (16 elements), uses __noswap_vmovl_high_s8, and reverses the sum. */ #ifdef __LITTLE_ENDIAN__ 70705 __ai __attribute__((target("neon"))) int16x8_t vaddw_high_s8(int16x8_t __p0, int8x16_t __p1) { 70706 int16x8_t __ret; 70707 __ret = __p0 + vmovl_high_s8(__p1); 70708 return __ret; 70709 } 70710 #else 70711 __ai __attribute__((target("neon"))) int16x8_t vaddw_high_s8(int16x8_t __p0, int8x16_t __p1) { 70712 int16x8_t __ret; 70713 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 70714 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70715 __ret = __rev0 + __noswap_vmovl_high_s8(__rev1); 70716 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 70717 return __ret; 70718 } 70719 #endif 70720 70721 #ifdef __LITTLE_ENDIAN__ 70722 __ai 
__attribute__((target("neon"))) int64x2_t vaddw_high_s32(int64x2_t __p0, int32x4_t __p1) { 70723 int64x2_t __ret; 70724 __ret = __p0 + vmovl_high_s32(__p1); 70725 return __ret; 70726 } 70727 #else /* Non-little-endian vaddw_high_s32: reverses __p0 (2 elements) and __p1 (4 elements), computes __rev0 + __noswap_vmovl_high_s32(__rev1), and reverses the 2-element sum. */ 70728 __ai __attribute__((target("neon"))) int64x2_t vaddw_high_s32(int64x2_t __p0, int32x4_t __p1) { 70729 int64x2_t __ret; 70730 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 70731 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 70732 __ret = __rev0 + __noswap_vmovl_high_s32(__rev1); 70733 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 70734 return __ret; 70735 } 70736 #endif 70737 70738 /* vaddw_high_s16: returns __p0 + vmovl_high_s16(__p1) as an int32x4_t. The #else variant reverses __p0 (4 elements) and __p1 (8 elements), uses __noswap_vmovl_high_s16, and reverses the sum. */ #ifdef __LITTLE_ENDIAN__ 70739 __ai __attribute__((target("neon"))) int32x4_t vaddw_high_s16(int32x4_t __p0, int16x8_t __p1) { 70740 int32x4_t __ret; 70741 __ret = __p0 + vmovl_high_s16(__p1); 70742 return __ret; 70743 } 70744 #else 70745 __ai __attribute__((target("neon"))) int32x4_t vaddw_high_s16(int32x4_t __p0, int16x8_t __p1) { 70746 int32x4_t __ret; 70747 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 70748 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 70749 __ret = __rev0 + __noswap_vmovl_high_s16(__rev1); 70750 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 70751 return __ret; 70752 } 70753 #endif 70754 70755 /* vcopyq_lane_p64(__p0, __p1, __p2, __p3): reads lane __p3 of the poly64x1_t __p2 with vget_lane_p64 and writes it into lane __p1 of the poly64x2_t __p0 with vsetq_lane_p64. In the #else variant only __p0 and the result are element-reversed; the single-element __p2 is read directly. */ #ifdef __LITTLE_ENDIAN__ 70756 #define vcopyq_lane_p64(__p0_893, __p1_893, __p2_893, __p3_893) __extension__ ({ \ 70757 poly64x2_t __ret_893; \ 70758 poly64x2_t __s0_893 = __p0_893; \ 70759 poly64x1_t __s2_893 = __p2_893; \ 70760 __ret_893 = vsetq_lane_p64(vget_lane_p64(__s2_893, __p3_893), __s0_893, __p1_893); \ 70761 __ret_893; \ 70762 }) 70763 #else 70764 #define vcopyq_lane_p64(__p0_894, __p1_894, __p2_894, __p3_894) __extension__ ({ \ 70765 poly64x2_t __ret_894; \ 70766 poly64x2_t __s0_894 = __p0_894; \ 70767 poly64x1_t __s2_894 = __p2_894; \ 70768 poly64x2_t __rev0_894; __rev0_894 = __builtin_shufflevector(__s0_894, __s0_894, 1, 
0); \ 70769 __ret_894 = __noswap_vsetq_lane_p64(vget_lane_p64(__s2_894, __p3_894), __rev0_894, __p1_894); \ 70770 __ret_894 = __builtin_shufflevector(__ret_894, __ret_894, 1, 0); \ 70771 __ret_894; \ 70772 }) 70773 #endif 70774 70775 /* vcopyq_lane_f64(__p0, __p1, __p2, __p3): reads lane __p3 of the float64x1_t __p2 with vget_lane_f64 and writes it into lane __p1 of the float64x2_t __p0 with vsetq_lane_f64. In the #else variant only __p0 and the result are element-reversed; the single-element __p2 is read directly. */ #ifdef __LITTLE_ENDIAN__ 70776 #define vcopyq_lane_f64(__p0_895, __p1_895, __p2_895, __p3_895) __extension__ ({ \ 70777 float64x2_t __ret_895; \ 70778 float64x2_t __s0_895 = __p0_895; \ 70779 float64x1_t __s2_895 = __p2_895; \ 70780 __ret_895 = vsetq_lane_f64(vget_lane_f64(__s2_895, __p3_895), __s0_895, __p1_895); \ 70781 __ret_895; \ 70782 }) 70783 #else 70784 #define vcopyq_lane_f64(__p0_896, __p1_896, __p2_896, __p3_896) __extension__ ({ \ 70785 float64x2_t __ret_896; \ 70786 float64x2_t __s0_896 = __p0_896; \ 70787 float64x1_t __s2_896 = __p2_896; \ 70788 float64x2_t __rev0_896; __rev0_896 = __builtin_shufflevector(__s0_896, __s0_896, 1, 0); \ 70789 __ret_896 = __noswap_vsetq_lane_f64(vget_lane_f64(__s2_896, __p3_896), __rev0_896, __p1_896); \ 70790 __ret_896 = __builtin_shufflevector(__ret_896, __ret_896, 1, 0); \ 70791 __ret_896; \ 70792 }) 70793 #endif 70794 70795 /* vcopy_lane_p64(__p0, __p1, __p2, __p3): both vectors are poly64x1_t, so there is a single definition with no endianness split; it is vset_lane_p64(vget_lane_p64(__p2, __p3), __p0, __p1). */ #define vcopy_lane_p64(__p0_897, __p1_897, __p2_897, __p3_897) __extension__ ({ \ 70796 poly64x1_t __ret_897; \ 70797 poly64x1_t __s0_897 = __p0_897; \ 70798 poly64x1_t __s2_897 = __p2_897; \ 70799 __ret_897 = vset_lane_p64(vget_lane_p64(__s2_897, __p3_897), __s0_897, __p1_897); \ 70800 __ret_897; \ 70801 }) 70802 /* vcopy_lane_f64: float64x1_t counterpart of vcopy_lane_p64, built from vset_lane_f64 and vget_lane_f64; likewise a single definition. */ #define vcopy_lane_f64(__p0_898, __p1_898, __p2_898, __p3_898) __extension__ ({ \ 70803 float64x1_t __ret_898; \ 70804 float64x1_t __s0_898 = __p0_898; \ 70805 float64x1_t __s2_898 = __p2_898; \ 70806 __ret_898 = vset_lane_f64(vget_lane_f64(__s2_898, __p3_898), __s0_898, __p1_898); \ 70807 __ret_898; \ 70808 }) 70809 /* vcopyq_laneq_p64(__p0, __p1, __p2, __p3): both vectors are poly64x2_t; lane __p3 of __p2 is read with vgetq_lane_p64 and written into lane __p1 of __p0 with vsetq_lane_p64. */ #ifdef __LITTLE_ENDIAN__ 70810 #define vcopyq_laneq_p64(__p0_899, __p1_899, __p2_899, __p3_899) __extension__ ({ \ 70811 poly64x2_t __ret_899; \ 70812 poly64x2_t __s0_899 = __p0_899; \ 70813 poly64x2_t __s2_899 = __p2_899; \ 70814 __ret_899 = 
vsetq_lane_p64(vgetq_lane_p64(__s2_899, __p3_899), __s0_899, __p1_899); \ 70815 __ret_899; \ 70816 }) 70817 #else /* Non-little-endian vcopyq_laneq_p64: reverses both 2-element vectors, copies the lane with the __noswap_ get/set helpers, and reverses the result. */ 70818 #define vcopyq_laneq_p64(__p0_900, __p1_900, __p2_900, __p3_900) __extension__ ({ \ 70819 poly64x2_t __ret_900; \ 70820 poly64x2_t __s0_900 = __p0_900; \ 70821 poly64x2_t __s2_900 = __p2_900; \ 70822 poly64x2_t __rev0_900; __rev0_900 = __builtin_shufflevector(__s0_900, __s0_900, 1, 0); \ 70823 poly64x2_t __rev2_900; __rev2_900 = __builtin_shufflevector(__s2_900, __s2_900, 1, 0); \ 70824 __ret_900 = __noswap_vsetq_lane_p64(__noswap_vgetq_lane_p64(__rev2_900, __p3_900), __rev0_900, __p1_900); \ 70825 __ret_900 = __builtin_shufflevector(__ret_900, __ret_900, 1, 0); \ 70826 __ret_900; \ 70827 }) 70828 #endif 70829 70830 /* vcopyq_laneq_f64(__p0, __p1, __p2, __p3): both vectors are float64x2_t; lane __p3 of __p2 is read with vgetq_lane_f64 and written into lane __p1 of __p0 with vsetq_lane_f64. The #else variant reverses both inputs, uses the __noswap_ helpers, and reverses the result. */ #ifdef __LITTLE_ENDIAN__ 70831 #define vcopyq_laneq_f64(__p0_901, __p1_901, __p2_901, __p3_901) __extension__ ({ \ 70832 float64x2_t __ret_901; \ 70833 float64x2_t __s0_901 = __p0_901; \ 70834 float64x2_t __s2_901 = __p2_901; \ 70835 __ret_901 = vsetq_lane_f64(vgetq_lane_f64(__s2_901, __p3_901), __s0_901, __p1_901); \ 70836 __ret_901; \ 70837 }) 70838 #else 70839 #define vcopyq_laneq_f64(__p0_902, __p1_902, __p2_902, __p3_902) __extension__ ({ \ 70840 float64x2_t __ret_902; \ 70841 float64x2_t __s0_902 = __p0_902; \ 70842 float64x2_t __s2_902 = __p2_902; \ 70843 float64x2_t __rev0_902; __rev0_902 = __builtin_shufflevector(__s0_902, __s0_902, 1, 0); \ 70844 float64x2_t __rev2_902; __rev2_902 = __builtin_shufflevector(__s2_902, __s2_902, 1, 0); \ 70845 __ret_902 = __noswap_vsetq_lane_f64(__noswap_vgetq_lane_f64(__rev2_902, __p3_902), __rev0_902, __p1_902); \ 70846 __ret_902 = __builtin_shufflevector(__ret_902, __ret_902, 1, 0); \ 70847 __ret_902; \ 70848 }) 70849 #endif 70850 70851 /* vcopy_laneq_p64(__p0, __p1, __p2, __p3): the destination __p0 is a poly64x1_t and the lane source __p2 is a poly64x2_t. */ #ifdef __LITTLE_ENDIAN__ 70852 #define vcopy_laneq_p64(__p0_903, __p1_903, __p2_903, __p3_903) __extension__ ({ \ 70853 poly64x1_t __ret_903; \ 70854 poly64x1_t __s0_903 = __p0_903; \ 70855 poly64x2_t __s2_903 = __p2_903; \ 70856 __ret_903 = 
vset_lane_p64(vgetq_lane_p64(__s2_903, __p3_903), __s0_903, __p1_903); \ 70857 __ret_903; \ 70858 }) 70859 #else /* Non-little-endian vcopy_laneq_p64: only the 2-element source __p2 is reversed (and read with __noswap_vgetq_lane_p64); the single-element destination and result are used as-is through plain vset_lane_p64. */ 70860 #define vcopy_laneq_p64(__p0_904, __p1_904, __p2_904, __p3_904) __extension__ ({ \ 70861 poly64x1_t __ret_904; \ 70862 poly64x1_t __s0_904 = __p0_904; \ 70863 poly64x2_t __s2_904 = __p2_904; \ 70864 poly64x2_t __rev2_904; __rev2_904 = __builtin_shufflevector(__s2_904, __s2_904, 1, 0); \ 70865 __ret_904 = vset_lane_p64(__noswap_vgetq_lane_p64(__rev2_904, __p3_904), __s0_904, __p1_904); \ 70866 __ret_904; \ 70867 }) 70868 #endif 70869 70870 /* vcopy_laneq_f64(__p0, __p1, __p2, __p3): writes lane __p3 of the float64x2_t __p2 into lane __p1 of the float64x1_t __p0 via vset_lane_f64 and vgetq_lane_f64. In the #else variant only __p2 is reversed; the single-element destination and result are used as-is. */ #ifdef __LITTLE_ENDIAN__ 70871 #define vcopy_laneq_f64(__p0_905, __p1_905, __p2_905, __p3_905) __extension__ ({ \ 70872 float64x1_t __ret_905; \ 70873 float64x1_t __s0_905 = __p0_905; \ 70874 float64x2_t __s2_905 = __p2_905; \ 70875 __ret_905 = vset_lane_f64(vgetq_lane_f64(__s2_905, __p3_905), __s0_905, __p1_905); \ 70876 __ret_905; \ 70877 }) 70878 #else 70879 #define vcopy_laneq_f64(__p0_906, __p1_906, __p2_906, __p3_906) __extension__ ({ \ 70880 float64x1_t __ret_906; \ 70881 float64x1_t __s0_906 = __p0_906; \ 70882 float64x2_t __s2_906 = __p2_906; \ 70883 float64x2_t __rev2_906; __rev2_906 = __builtin_shufflevector(__s2_906, __s2_906, 1, 0); \ 70884 __ret_906 = vset_lane_f64(__noswap_vgetq_lane_f64(__rev2_906, __p3_906), __s0_906, __p1_906); \ 70885 __ret_906; \ 70886 }) 70887 #endif 70888 70889 /* vmlal_high_u8: returns vmlal_u8(__p0, vget_high_u8(__p1), vget_high_u8(__p2)). The #else variant reverses all three inputs, uses the __noswap_ helpers, and reverses the 8-element result. */ #ifdef __LITTLE_ENDIAN__ 70890 __ai __attribute__((target("neon"))) uint16x8_t vmlal_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 70891 uint16x8_t __ret; 70892 __ret = vmlal_u8(__p0, vget_high_u8(__p1), vget_high_u8(__p2)); 70893 return __ret; 70894 } 70895 #else 70896 __ai __attribute__((target("neon"))) uint16x8_t vmlal_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 70897 uint16x8_t __ret; 70898 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 70899 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 
5, 4, 3, 2, 1, 0); 70900 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70901 __ret = __noswap_vmlal_u8(__rev0, __noswap_vget_high_u8(__rev1), __noswap_vget_high_u8(__rev2)); 70902 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 70903 return __ret; 70904 } 70905 #endif 70906 70907 /* vmlal_high_u32: returns vmlal_u32(__p0, vget_high_u32(__p1), vget_high_u32(__p2)). The #else variant reverses all three inputs, uses the __noswap_ helpers, and reverses the 2-element result. */ #ifdef __LITTLE_ENDIAN__ 70908 __ai __attribute__((target("neon"))) uint64x2_t vmlal_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 70909 uint64x2_t __ret; 70910 __ret = vmlal_u32(__p0, vget_high_u32(__p1), vget_high_u32(__p2)); 70911 return __ret; 70912 } 70913 #else 70914 __ai __attribute__((target("neon"))) uint64x2_t vmlal_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 70915 uint64x2_t __ret; 70916 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 70917 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 70918 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 70919 __ret = __noswap_vmlal_u32(__rev0, __noswap_vget_high_u32(__rev1), __noswap_vget_high_u32(__rev2)); 70920 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 70921 return __ret; 70922 } 70923 #endif 70924 70925 /* vmlal_high_u16: returns vmlal_u16(__p0, vget_high_u16(__p1), vget_high_u16(__p2)). The #else variant reverses all three inputs, uses the __noswap_ helpers, and reverses the 4-element result. */ #ifdef __LITTLE_ENDIAN__ 70926 __ai __attribute__((target("neon"))) uint32x4_t vmlal_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 70927 uint32x4_t __ret; 70928 __ret = vmlal_u16(__p0, vget_high_u16(__p1), vget_high_u16(__p2)); 70929 return __ret; 70930 } 70931 #else 70932 __ai __attribute__((target("neon"))) uint32x4_t vmlal_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 70933 uint32x4_t __ret; 70934 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 70935 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 70936 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 70937 __ret = 
__noswap_vmlal_u16(__rev0, __noswap_vget_high_u16(__rev1), __noswap_vget_high_u16(__rev2)); 70938 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 70939 return __ret; 70940 } 70941 #endif 70942 70943 /* vmlal_high_s8: returns vmlal_s8(__p0, vget_high_s8(__p1), vget_high_s8(__p2)). The #else variant reverses all three inputs, uses the __noswap_ helpers, and reverses the 8-element result. */ #ifdef __LITTLE_ENDIAN__ 70944 __ai __attribute__((target("neon"))) int16x8_t vmlal_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) { 70945 int16x8_t __ret; 70946 __ret = vmlal_s8(__p0, vget_high_s8(__p1), vget_high_s8(__p2)); 70947 return __ret; 70948 } 70949 #else 70950 __ai __attribute__((target("neon"))) int16x8_t vmlal_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) { 70951 int16x8_t __ret; 70952 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 70953 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70954 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 70955 __ret = __noswap_vmlal_s8(__rev0, __noswap_vget_high_s8(__rev1), __noswap_vget_high_s8(__rev2)); 70956 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 70957 return __ret; 70958 } 70959 #endif 70960 70961 /* vmlal_high_s32: returns vmlal_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2)). The #else variant reverses all three inputs, uses the __noswap_ helpers, and reverses the 2-element result. */ #ifdef __LITTLE_ENDIAN__ 70962 __ai __attribute__((target("neon"))) int64x2_t vmlal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 70963 int64x2_t __ret; 70964 __ret = vmlal_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2)); 70965 return __ret; 70966 } 70967 #else 70968 __ai __attribute__((target("neon"))) int64x2_t vmlal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 70969 int64x2_t __ret; 70970 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 70971 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 70972 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 70973 __ret = __noswap_vmlal_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2)); 70974 __ret = 
__builtin_shufflevector(__ret, __ret, 1, 0); 70975 return __ret; 70976 } 70977 #endif 70978 70979 /* vmlal_high_s16: returns vmlal_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2)). The #else variant reverses all three inputs, uses the __noswap_ helpers, and reverses the 4-element result. */ #ifdef __LITTLE_ENDIAN__ 70980 __ai __attribute__((target("neon"))) int32x4_t vmlal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 70981 int32x4_t __ret; 70982 __ret = vmlal_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2)); 70983 return __ret; 70984 } 70985 #else 70986 __ai __attribute__((target("neon"))) int32x4_t vmlal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 70987 int32x4_t __ret; 70988 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 70989 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 70990 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 70991 __ret = __noswap_vmlal_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2)); 70992 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 70993 return __ret; 70994 } 70995 #endif 70996 70997 /* vmlal_high_n_u32: returns vmlal_n_u32(__p0, vget_high_u32(__p1), __p2), where __p2 is a scalar uint32_t. The #else variant reverses the two vector inputs only (the scalar is passed through), uses the __noswap_ helpers, and reverses the 2-element result. */ #ifdef __LITTLE_ENDIAN__ 70998 __ai __attribute__((target("neon"))) uint64x2_t vmlal_high_n_u32(uint64x2_t __p0, uint32x4_t __p1, uint32_t __p2) { 70999 uint64x2_t __ret; 71000 __ret = vmlal_n_u32(__p0, vget_high_u32(__p1), __p2); 71001 return __ret; 71002 } 71003 #else 71004 __ai __attribute__((target("neon"))) uint64x2_t vmlal_high_n_u32(uint64x2_t __p0, uint32x4_t __p1, uint32_t __p2) { 71005 uint64x2_t __ret; 71006 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71007 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71008 __ret = __noswap_vmlal_n_u32(__rev0, __noswap_vget_high_u32(__rev1), __p2); 71009 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 71010 return __ret; 71011 } 71012 #endif 71013 71014 /* vmlal_high_n_u16 (little-endian variant): passes __p0, vget_high_u16(__p1) and the scalar uint16_t __p2 to vmlal_n_u16. */ #ifdef __LITTLE_ENDIAN__ 71015 __ai __attribute__((target("neon"))) uint32x4_t vmlal_high_n_u16(uint32x4_t __p0, uint16x8_t __p1, uint16_t __p2) { 71016 uint32x4_t __ret; 71017 __ret = vmlal_n_u16(__p0, 
vget_high_u16(__p1), __p2); 71018 return __ret; 71019 } 71020 #else /* Non-little-endian vmlal_high_n_u16: reverses __p0 (4 elements) and __p1 (8 elements), calls __noswap_vmlal_n_u16 with __noswap_vget_high_u16(__rev1) and the unmodified scalar __p2, and reverses the 4-element result. */ 71021 __ai __attribute__((target("neon"))) uint32x4_t vmlal_high_n_u16(uint32x4_t __p0, uint16x8_t __p1, uint16_t __p2) { 71022 uint32x4_t __ret; 71023 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71024 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71025 __ret = __noswap_vmlal_n_u16(__rev0, __noswap_vget_high_u16(__rev1), __p2); 71026 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71027 return __ret; 71028 } 71029 #endif 71030 71031 /* vmlal_high_n_s32: returns vmlal_n_s32(__p0, vget_high_s32(__p1), __p2), where __p2 is a scalar int32_t. The #else variant reverses the two vector inputs only, uses the __noswap_ helpers, and reverses the 2-element result. */ #ifdef __LITTLE_ENDIAN__ 71032 __ai __attribute__((target("neon"))) int64x2_t vmlal_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) { 71033 int64x2_t __ret; 71034 __ret = vmlal_n_s32(__p0, vget_high_s32(__p1), __p2); 71035 return __ret; 71036 } 71037 #else 71038 __ai __attribute__((target("neon"))) int64x2_t vmlal_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) { 71039 int64x2_t __ret; 71040 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71041 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71042 __ret = __noswap_vmlal_n_s32(__rev0, __noswap_vget_high_s32(__rev1), __p2); 71043 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 71044 return __ret; 71045 } 71046 #endif 71047 71048 /* vmlal_high_n_s16: returns vmlal_n_s16(__p0, vget_high_s16(__p1), __p2), where __p2 is a scalar int16_t. The #else variant reverses the two vector inputs only, uses the __noswap_ helpers, and reverses the 4-element result. */ #ifdef __LITTLE_ENDIAN__ 71049 __ai __attribute__((target("neon"))) int32x4_t vmlal_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) { 71050 int32x4_t __ret; 71051 __ret = vmlal_n_s16(__p0, vget_high_s16(__p1), __p2); 71052 return __ret; 71053 } 71054 #else 71055 __ai __attribute__((target("neon"))) int32x4_t vmlal_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) { 71056 int32x4_t __ret; 71057 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71058 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71059 __ret = __noswap_vmlal_n_s16(__rev0, 
__noswap_vget_high_s16(__rev1), __p2); 71060 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71061 return __ret; 71062 } 71063 #endif 71064 71065 #ifdef __LITTLE_ENDIAN__ 71066 __ai __attribute__((target("neon"))) uint16x8_t vmlsl_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 71067 uint16x8_t __ret; 71068 __ret = vmlsl_u8(__p0, vget_high_u8(__p1), vget_high_u8(__p2)); 71069 return __ret; 71070 } 71071 #else 71072 __ai __attribute__((target("neon"))) uint16x8_t vmlsl_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 71073 uint16x8_t __ret; 71074 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 71075 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 71076 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 71077 __ret = __noswap_vmlsl_u8(__rev0, __noswap_vget_high_u8(__rev1), __noswap_vget_high_u8(__rev2)); 71078 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 71079 return __ret; 71080 } 71081 #endif 71082 71083 #ifdef __LITTLE_ENDIAN__ 71084 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 71085 uint64x2_t __ret; 71086 __ret = vmlsl_u32(__p0, vget_high_u32(__p1), vget_high_u32(__p2)); 71087 return __ret; 71088 } 71089 #else 71090 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 71091 uint64x2_t __ret; 71092 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71093 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71094 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 71095 __ret = __noswap_vmlsl_u32(__rev0, __noswap_vget_high_u32(__rev1), __noswap_vget_high_u32(__rev2)); 71096 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 
71097 return __ret; 71098 } 71099 #endif 71100 71101 #ifdef __LITTLE_ENDIAN__ 71102 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 71103 uint32x4_t __ret; 71104 __ret = vmlsl_u16(__p0, vget_high_u16(__p1), vget_high_u16(__p2)); 71105 return __ret; 71106 } 71107 #else 71108 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 71109 uint32x4_t __ret; 71110 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71111 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71112 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 71113 __ret = __noswap_vmlsl_u16(__rev0, __noswap_vget_high_u16(__rev1), __noswap_vget_high_u16(__rev2)); 71114 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71115 return __ret; 71116 } 71117 #endif 71118 71119 #ifdef __LITTLE_ENDIAN__ 71120 __ai __attribute__((target("neon"))) int16x8_t vmlsl_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) { 71121 int16x8_t __ret; 71122 __ret = vmlsl_s8(__p0, vget_high_s8(__p1), vget_high_s8(__p2)); 71123 return __ret; 71124 } 71125 #else 71126 __ai __attribute__((target("neon"))) int16x8_t vmlsl_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) { 71127 int16x8_t __ret; 71128 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 71129 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 71130 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 71131 __ret = __noswap_vmlsl_s8(__rev0, __noswap_vget_high_s8(__rev1), __noswap_vget_high_s8(__rev2)); 71132 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 71133 return __ret; 71134 } 71135 #endif 71136 71137 #ifdef __LITTLE_ENDIAN__ 
71138 __ai __attribute__((target("neon"))) int64x2_t vmlsl_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 71139 int64x2_t __ret; 71140 __ret = vmlsl_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2)); 71141 return __ret; 71142 } 71143 #else 71144 __ai __attribute__((target("neon"))) int64x2_t vmlsl_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 71145 int64x2_t __ret; 71146 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71147 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71148 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 71149 __ret = __noswap_vmlsl_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2)); 71150 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 71151 return __ret; 71152 } 71153 #endif 71154 71155 #ifdef __LITTLE_ENDIAN__ 71156 __ai __attribute__((target("neon"))) int32x4_t vmlsl_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 71157 int32x4_t __ret; 71158 __ret = vmlsl_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2)); 71159 return __ret; 71160 } 71161 #else 71162 __ai __attribute__((target("neon"))) int32x4_t vmlsl_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 71163 int32x4_t __ret; 71164 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71165 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71166 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 71167 __ret = __noswap_vmlsl_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2)); 71168 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71169 return __ret; 71170 } 71171 #endif 71172 71173 #ifdef __LITTLE_ENDIAN__ 71174 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_high_n_u32(uint64x2_t __p0, uint32x4_t __p1, uint32_t __p2) { 71175 uint64x2_t __ret; 71176 __ret = vmlsl_n_u32(__p0, vget_high_u32(__p1), __p2); 
71177 return __ret; 71178 } 71179 #else 71180 __ai __attribute__((target("neon"))) uint64x2_t vmlsl_high_n_u32(uint64x2_t __p0, uint32x4_t __p1, uint32_t __p2) { 71181 uint64x2_t __ret; 71182 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71183 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71184 __ret = __noswap_vmlsl_n_u32(__rev0, __noswap_vget_high_u32(__rev1), __p2); 71185 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 71186 return __ret; 71187 } 71188 #endif 71189 71190 #ifdef __LITTLE_ENDIAN__ 71191 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_high_n_u16(uint32x4_t __p0, uint16x8_t __p1, uint16_t __p2) { 71192 uint32x4_t __ret; 71193 __ret = vmlsl_n_u16(__p0, vget_high_u16(__p1), __p2); 71194 return __ret; 71195 } 71196 #else 71197 __ai __attribute__((target("neon"))) uint32x4_t vmlsl_high_n_u16(uint32x4_t __p0, uint16x8_t __p1, uint16_t __p2) { 71198 uint32x4_t __ret; 71199 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71200 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71201 __ret = __noswap_vmlsl_n_u16(__rev0, __noswap_vget_high_u16(__rev1), __p2); 71202 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71203 return __ret; 71204 } 71205 #endif 71206 71207 #ifdef __LITTLE_ENDIAN__ 71208 __ai __attribute__((target("neon"))) int64x2_t vmlsl_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) { 71209 int64x2_t __ret; 71210 __ret = vmlsl_n_s32(__p0, vget_high_s32(__p1), __p2); 71211 return __ret; 71212 } 71213 #else 71214 __ai __attribute__((target("neon"))) int64x2_t vmlsl_high_n_s32(int64x2_t __p0, int32x4_t __p1, int32_t __p2) { 71215 int64x2_t __ret; 71216 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71217 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71218 __ret = __noswap_vmlsl_n_s32(__rev0, __noswap_vget_high_s32(__rev1), __p2); 71219 __ret = 
__builtin_shufflevector(__ret, __ret, 1, 0); 71220 return __ret; 71221 } 71222 #endif 71223 71224 #ifdef __LITTLE_ENDIAN__ 71225 __ai __attribute__((target("neon"))) int32x4_t vmlsl_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) { 71226 int32x4_t __ret; 71227 __ret = vmlsl_n_s16(__p0, vget_high_s16(__p1), __p2); 71228 return __ret; 71229 } 71230 #else 71231 __ai __attribute__((target("neon"))) int32x4_t vmlsl_high_n_s16(int32x4_t __p0, int16x8_t __p1, int16_t __p2) { 71232 int32x4_t __ret; 71233 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71234 int16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71235 __ret = __noswap_vmlsl_n_s16(__rev0, __noswap_vget_high_s16(__rev1), __p2); 71236 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71237 return __ret; 71238 } 71239 #endif 71240 71241 #define vmulx_lane_f64(__p0_907, __p1_907, __p2_907) __extension__ ({ \ 71242 float64x1_t __ret_907; \ 71243 float64x1_t __s0_907 = __p0_907; \ 71244 float64x1_t __s1_907 = __p1_907; \ 71245 float64_t __x_907 = vget_lane_f64(__s0_907, 0); \ 71246 float64_t __y_907 = vget_lane_f64(__s1_907, __p2_907); \ 71247 float64_t __z_907 = vmulxd_f64(__x_907, __y_907); \ 71248 __ret_907 = vset_lane_f64(__z_907, __s0_907, __p2_907); \ 71249 __ret_907; \ 71250 }) 71251 #ifdef __LITTLE_ENDIAN__ 71252 #define vmulx_laneq_f64(__p0_908, __p1_908, __p2_908) __extension__ ({ \ 71253 float64x1_t __ret_908; \ 71254 float64x1_t __s0_908 = __p0_908; \ 71255 float64x2_t __s1_908 = __p1_908; \ 71256 float64_t __x_908 = vget_lane_f64(__s0_908, 0); \ 71257 float64_t __y_908 = vgetq_lane_f64(__s1_908, __p2_908); \ 71258 float64_t __z_908 = vmulxd_f64(__x_908, __y_908); \ 71259 __ret_908 = vset_lane_f64(__z_908, __s0_908, 0); \ 71260 __ret_908; \ 71261 }) 71262 #else 71263 #define vmulx_laneq_f64(__p0_909, __p1_909, __p2_909) __extension__ ({ \ 71264 float64x1_t __ret_909; \ 71265 float64x1_t __s0_909 = __p0_909; \ 71266 
float64x2_t __s1_909 = __p1_909; \ 71267 float64x2_t __rev1_909; __rev1_909 = __builtin_shufflevector(__s1_909, __s1_909, 1, 0); \ 71268 float64_t __x_909 = vget_lane_f64(__s0_909, 0); \ 71269 float64_t __y_909 = __noswap_vgetq_lane_f64(__rev1_909, __p2_909); \ 71270 float64_t __z_909 = vmulxd_f64(__x_909, __y_909); \ 71271 __ret_909 = vset_lane_f64(__z_909, __s0_909, 0); \ 71272 __ret_909; \ 71273 }) 71274 #endif 71275 71276 #endif 71277 #ifdef __LITTLE_ENDIAN__ 71278 __ai __attribute__((target("neon"))) uint16x8_t vabal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 71279 uint16x8_t __ret; 71280 __ret = __p0 + vabdl_u8(__p1, __p2); 71281 return __ret; 71282 } 71283 #else 71284 __ai __attribute__((target("neon"))) uint16x8_t vabal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 71285 uint16x8_t __ret; 71286 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 71287 uint8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71288 uint8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 71289 __ret = __rev0 + __noswap_vabdl_u8(__rev1, __rev2); 71290 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 71291 return __ret; 71292 } 71293 __ai __attribute__((target("neon"))) uint16x8_t __noswap_vabal_u8(uint16x8_t __p0, uint8x8_t __p1, uint8x8_t __p2) { 71294 uint16x8_t __ret; 71295 __ret = __p0 + __noswap_vabdl_u8(__p1, __p2); 71296 return __ret; 71297 } 71298 #endif 71299 71300 #ifdef __LITTLE_ENDIAN__ 71301 __ai __attribute__((target("neon"))) uint64x2_t vabal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 71302 uint64x2_t __ret; 71303 __ret = __p0 + vabdl_u32(__p1, __p2); 71304 return __ret; 71305 } 71306 #else 71307 __ai __attribute__((target("neon"))) uint64x2_t vabal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 71308 uint64x2_t __ret; 71309 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71310 
uint32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 71311 uint32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 71312 __ret = __rev0 + __noswap_vabdl_u32(__rev1, __rev2); 71313 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 71314 return __ret; 71315 } 71316 __ai __attribute__((target("neon"))) uint64x2_t __noswap_vabal_u32(uint64x2_t __p0, uint32x2_t __p1, uint32x2_t __p2) { 71317 uint64x2_t __ret; 71318 __ret = __p0 + __noswap_vabdl_u32(__p1, __p2); 71319 return __ret; 71320 } 71321 #endif 71322 71323 #ifdef __LITTLE_ENDIAN__ 71324 __ai __attribute__((target("neon"))) uint32x4_t vabal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 71325 uint32x4_t __ret; 71326 __ret = __p0 + vabdl_u16(__p1, __p2); 71327 return __ret; 71328 } 71329 #else 71330 __ai __attribute__((target("neon"))) uint32x4_t vabal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 71331 uint32x4_t __ret; 71332 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71333 uint16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71334 uint16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 71335 __ret = __rev0 + __noswap_vabdl_u16(__rev1, __rev2); 71336 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71337 return __ret; 71338 } 71339 __ai __attribute__((target("neon"))) uint32x4_t __noswap_vabal_u16(uint32x4_t __p0, uint16x4_t __p1, uint16x4_t __p2) { 71340 uint32x4_t __ret; 71341 __ret = __p0 + __noswap_vabdl_u16(__p1, __p2); 71342 return __ret; 71343 } 71344 #endif 71345 71346 #ifdef __LITTLE_ENDIAN__ 71347 __ai __attribute__((target("neon"))) int16x8_t vabal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 71348 int16x8_t __ret; 71349 __ret = __p0 + vabdl_s8(__p1, __p2); 71350 return __ret; 71351 } 71352 #else 71353 __ai __attribute__((target("neon"))) int16x8_t vabal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 71354 int16x8_t __ret; 71355 int16x8_t __rev0; 
__rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 71356 int8x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71357 int8x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 71358 __ret = __rev0 + __noswap_vabdl_s8(__rev1, __rev2); 71359 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 71360 return __ret; 71361 } 71362 __ai __attribute__((target("neon"))) int16x8_t __noswap_vabal_s8(int16x8_t __p0, int8x8_t __p1, int8x8_t __p2) { 71363 int16x8_t __ret; 71364 __ret = __p0 + __noswap_vabdl_s8(__p1, __p2); 71365 return __ret; 71366 } 71367 #endif 71368 71369 #ifdef __LITTLE_ENDIAN__ 71370 __ai __attribute__((target("neon"))) int64x2_t vabal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 71371 int64x2_t __ret; 71372 __ret = __p0 + vabdl_s32(__p1, __p2); 71373 return __ret; 71374 } 71375 #else 71376 __ai __attribute__((target("neon"))) int64x2_t vabal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 71377 int64x2_t __ret; 71378 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71379 int32x2_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 1, 0); 71380 int32x2_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 1, 0); 71381 __ret = __rev0 + __noswap_vabdl_s32(__rev1, __rev2); 71382 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 71383 return __ret; 71384 } 71385 __ai __attribute__((target("neon"))) int64x2_t __noswap_vabal_s32(int64x2_t __p0, int32x2_t __p1, int32x2_t __p2) { 71386 int64x2_t __ret; 71387 __ret = __p0 + __noswap_vabdl_s32(__p1, __p2); 71388 return __ret; 71389 } 71390 #endif 71391 71392 #ifdef __LITTLE_ENDIAN__ 71393 __ai __attribute__((target("neon"))) int32x4_t vabal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 71394 int32x4_t __ret; 71395 __ret = __p0 + vabdl_s16(__p1, __p2); 71396 return __ret; 71397 } 71398 #else 71399 __ai __attribute__((target("neon"))) int32x4_t vabal_s16(int32x4_t __p0, 
int16x4_t __p1, int16x4_t __p2) { 71400 int32x4_t __ret; 71401 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71402 int16x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71403 int16x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 71404 __ret = __rev0 + __noswap_vabdl_s16(__rev1, __rev2); 71405 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71406 return __ret; 71407 } 71408 __ai __attribute__((target("neon"))) int32x4_t __noswap_vabal_s16(int32x4_t __p0, int16x4_t __p1, int16x4_t __p2) { 71409 int32x4_t __ret; 71410 __ret = __p0 + __noswap_vabdl_s16(__p1, __p2); 71411 return __ret; 71412 } 71413 #endif 71414 71415 #if defined(__aarch64__) || defined(__arm64ec__) 71416 #ifdef __LITTLE_ENDIAN__ 71417 __ai __attribute__((target("neon"))) uint16x8_t vabal_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 71418 uint16x8_t __ret; 71419 __ret = vabal_u8(__p0, vget_high_u8(__p1), vget_high_u8(__p2)); 71420 return __ret; 71421 } 71422 #else 71423 __ai __attribute__((target("neon"))) uint16x8_t vabal_high_u8(uint16x8_t __p0, uint8x16_t __p1, uint8x16_t __p2) { 71424 uint16x8_t __ret; 71425 uint16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 71426 uint8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 71427 uint8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 71428 __ret = __noswap_vabal_u8(__rev0, __noswap_vget_high_u8(__rev1), __noswap_vget_high_u8(__rev2)); 71429 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 71430 return __ret; 71431 } 71432 #endif 71433 71434 #ifdef __LITTLE_ENDIAN__ 71435 __ai __attribute__((target("neon"))) uint64x2_t vabal_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 71436 uint64x2_t __ret; 71437 __ret = vabal_u32(__p0, vget_high_u32(__p1), 
vget_high_u32(__p2)); 71438 return __ret; 71439 } 71440 #else 71441 __ai __attribute__((target("neon"))) uint64x2_t vabal_high_u32(uint64x2_t __p0, uint32x4_t __p1, uint32x4_t __p2) { 71442 uint64x2_t __ret; 71443 uint64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71444 uint32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71445 uint32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 71446 __ret = __noswap_vabal_u32(__rev0, __noswap_vget_high_u32(__rev1), __noswap_vget_high_u32(__rev2)); 71447 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 71448 return __ret; 71449 } 71450 #endif 71451 71452 #ifdef __LITTLE_ENDIAN__ 71453 __ai __attribute__((target("neon"))) uint32x4_t vabal_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 71454 uint32x4_t __ret; 71455 __ret = vabal_u16(__p0, vget_high_u16(__p1), vget_high_u16(__p2)); 71456 return __ret; 71457 } 71458 #else 71459 __ai __attribute__((target("neon"))) uint32x4_t vabal_high_u16(uint32x4_t __p0, uint16x8_t __p1, uint16x8_t __p2) { 71460 uint32x4_t __ret; 71461 uint32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71462 uint16x8_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71463 uint16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 71464 __ret = __noswap_vabal_u16(__rev0, __noswap_vget_high_u16(__rev1), __noswap_vget_high_u16(__rev2)); 71465 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71466 return __ret; 71467 } 71468 #endif 71469 71470 #ifdef __LITTLE_ENDIAN__ 71471 __ai __attribute__((target("neon"))) int16x8_t vabal_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) { 71472 int16x8_t __ret; 71473 __ret = vabal_s8(__p0, vget_high_s8(__p1), vget_high_s8(__p2)); 71474 return __ret; 71475 } 71476 #else 71477 __ai __attribute__((target("neon"))) int16x8_t vabal_high_s8(int16x8_t __p0, int8x16_t __p1, int8x16_t __p2) { 71478 
int16x8_t __ret; 71479 int16x8_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 7, 6, 5, 4, 3, 2, 1, 0); 71480 int8x16_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 71481 int8x16_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); 71482 __ret = __noswap_vabal_s8(__rev0, __noswap_vget_high_s8(__rev1), __noswap_vget_high_s8(__rev2)); 71483 __ret = __builtin_shufflevector(__ret, __ret, 7, 6, 5, 4, 3, 2, 1, 0); 71484 return __ret; 71485 } 71486 #endif 71487 71488 #ifdef __LITTLE_ENDIAN__ 71489 __ai __attribute__((target("neon"))) int64x2_t vabal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 71490 int64x2_t __ret; 71491 __ret = vabal_s32(__p0, vget_high_s32(__p1), vget_high_s32(__p2)); 71492 return __ret; 71493 } 71494 #else 71495 __ai __attribute__((target("neon"))) int64x2_t vabal_high_s32(int64x2_t __p0, int32x4_t __p1, int32x4_t __p2) { 71496 int64x2_t __ret; 71497 int64x2_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 1, 0); 71498 int32x4_t __rev1; __rev1 = __builtin_shufflevector(__p1, __p1, 3, 2, 1, 0); 71499 int32x4_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 3, 2, 1, 0); 71500 __ret = __noswap_vabal_s32(__rev0, __noswap_vget_high_s32(__rev1), __noswap_vget_high_s32(__rev2)); 71501 __ret = __builtin_shufflevector(__ret, __ret, 1, 0); 71502 return __ret; 71503 } 71504 #endif 71505 71506 #ifdef __LITTLE_ENDIAN__ 71507 __ai __attribute__((target("neon"))) int32x4_t vabal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 71508 int32x4_t __ret; 71509 __ret = vabal_s16(__p0, vget_high_s16(__p1), vget_high_s16(__p2)); 71510 return __ret; 71511 } 71512 #else 71513 __ai __attribute__((target("neon"))) int32x4_t vabal_high_s16(int32x4_t __p0, int16x8_t __p1, int16x8_t __p2) { 71514 int32x4_t __ret; 71515 int32x4_t __rev0; __rev0 = __builtin_shufflevector(__p0, __p0, 3, 2, 1, 0); 71516 int16x8_t __rev1; 
__rev1 = __builtin_shufflevector(__p1, __p1, 7, 6, 5, 4, 3, 2, 1, 0); 71517 int16x8_t __rev2; __rev2 = __builtin_shufflevector(__p2, __p2, 7, 6, 5, 4, 3, 2, 1, 0); 71518 __ret = __noswap_vabal_s16(__rev0, __noswap_vget_high_s16(__rev1), __noswap_vget_high_s16(__rev2)); 71519 __ret = __builtin_shufflevector(__ret, __ret, 3, 2, 1, 0); 71520 return __ret; 71521 } 71522 #endif 71523 71524 #endif 71525 71526 #undef __ai 71527 71528 #endif /* if !defined(__ARM_NEON) */ 71529 #endif /* ifndef __ARM_FP */